{"id":"https://openalex.org/W7160254590","doi":"https://doi.org/10.1109/wacv61042.2026.00403","title":"TalkingHeadBench: A Multi-Modal Benchmark &amp; Analysis of Talking-Head DeepFake Detection","display_name":"TalkingHeadBench: A Multi-Modal Benchmark &amp; Analysis of Talking-Head DeepFake Detection","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7160254590","doi":"https://doi.org/10.1109/wacv61042.2026.00403"},"language":null,"primary_location":{"id":"doi:10.1109/wacv61042.2026.00403","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00403","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135403814","display_name":"Xinqi Xiong","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xinqi Xiong","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102585514","display_name":"Prakrut Patel","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Prakrut Patel","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135394706","display_name":"Qingyuan Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qingyuan Fan","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135297718","display_name":"Amisha Wadhwa","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amisha Wadhwa","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135348024","display_name":"Sarathy Selvam","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarathy Selvam","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101545682","display_name":"Xiao Guo","orcid":"https://orcid.org/0000-0002-5440-6175"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiao Guo","raw_affiliation_strings":["Michigan State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Michigan State University","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006095883","display_name":"Luchao Qi","orcid":"https://orcid.org/0000-0002-3192-4746"},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Luchao Qi","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135403777","display_name":"Xiaoming Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoming Liu","raw_affiliation_strings":["Michigan State University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Michigan State University","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102635961","display_name":"Roni Sengupta","orcid":"https://orcid.org/0000-0001-5914-3469"},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Roni Sengupta","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5135403814"],"corresponding_institution_ids":["https://openalex.org/I114027177"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.92723128,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4139","last_page":"4149"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.46230000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.46230000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.09080000221729279,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.0746999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.46889999508857727},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.31220000982284546},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.29179999232292175},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.287200003862381}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5752999782562256},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.46889999508857727},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3691999912261963},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35030001401901245},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3391999900341034},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.29179999232292175},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27810001373291016},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/wacv61042.2026.00403","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00403","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W2616247523","https://openalex.org/W2871667416","https://openalex.org/W2962770929","https://openalex.org/W2982058372","https://openalex.org/W2984700035","https://openalex.org/W3017300133","https://openalex.org/W3092709185","https://openalex.org/W4247405818","https://openalex.org/W4312722235","https://openalex.org/W4319299873","https://openalex.org/W4319978495","https://openalex.org/W4367316141","https://openalex.org/W4386071484","https://openalex.org/W4386075856","https://openalex.org/W4386075957","https://openalex.org/W4386102876","https://openalex.org/W4390872774","https://openalex.org/W4390874333","https://openalex.org/W4391931465","https://openalex.org/W4394625274","https://openalex.org/W4399138486","https://openalex.org/W4399431188","https://openalex.org/W4399980772","https://openalex.org/W4400401421","https://openalex.org/W4400573497","https://openalex.org/W4402715910","https://openalex.org/W4402727609","https://openalex.org/W4402728455","https://openalex.org/W4402772264","https://openalex.org/W4403791323","https://openalex.org/W4404199615","https://openalex.org/W4404891145","https://openalex.org/W4405229107","https://openalex.org/W4405662451","https://openalex.org/W4406804129","https://openalex.org/W4409262373","https://openalex.org/W4411241923","https://openalex.org/W4412673785","https://openalex.org/W4413147005","https://openalex.org/W4413822471","https://openalex.org/W4415796454"],"related_works":[],"abstract_inverted_index":{"The":[0,88],"rapid":[1],"advancement":[2],"of":[3,16,101,174,196],"talking-head":[4,39,71],"deepfake":[5,38],"generation":[6],"fueled":[7],"by":[8],"advanced":[9],"generative":[10,199],"models":[11,135,192],"has":[12],"elevated":[13],"the":[14,194],"realism":[15],"synthetic":[17],"videos":[18,72,105],"to":[19,42,66,103,121,183],"a":[20,62,110,145,165],"level":[21],"that":[22,97,134],"poses":[23],"substantial":[24],"risks":[25],"in":[26,193],"domains":[27],"such":[28],"as":[29],"media,":[30],"politics,":[31],"and":[32,50,57,126,189,205,211],"finance.":[33],"However,":[34],"current":[35],"benchmarks":[36],"for":[37,85,114],"detection":[40,191],"fail":[41],"reflect":[43],"this":[44,68],"progress,":[45],"relying":[46],"on":[47,92,139,149,170],"outdated":[48],"generators":[49,82],"offering":[51],"limited":[52],"insight":[53],"into":[54],"model":[55],"robustness":[56],"generalization.":[58,87],"We":[59,201],"introduce":[60],"TalkingHeadBench,":[61],"new":[63],"benchmark":[64,181,204],"designed":[65,120],"address":[67],"gap,":[69],"featuring":[70],"from":[73],"six":[74],"modern":[75],"generators,":[76],"with":[77,106,136,207],"an":[78,93],"additional":[79],"two":[80],"emerging":[81],"used":[83],"exclusively":[84],"testing":[86],"dataset":[89,206],"is":[90],"built":[91],"expert-led":[94],"curation":[95],"process":[96],"filters":[98],"over":[99],"60%":[100],"samples":[102],"remove":[104],"noticeable":[107],"artifacts,":[108],"presenting":[109],"more":[111,187],"difficult":[112],"challenge":[113],"detectors.":[115],"Our":[116,180],"evaluation":[117],"protocols":[118,212],"are":[119],"measure":[122],"generalization":[123],"across":[124],"identity":[125],"generator":[127],"shifts.":[128],"Benchmarking":[129],"seven":[130],"state-of-the-art":[131],"detectors":[132,168],"reveals":[133],"high":[137],"accuracy":[138],"older":[140],"datasets":[141],"like":[142],"FaceForensics++":[143],"show":[144],"significant":[146],"performance":[147],"drop":[148],"our":[150,203],"curated":[151],"data,":[152],"particularly":[153],"at":[154,213],"strict":[155],"false":[156],"positive":[157],"rates":[158],"(e.g.,":[159],"TPR@FPR=0.1%).":[160],"In":[161],"addition,":[162],"we":[163],"identify":[164],"trend":[166],"where":[167],"focus":[169],"background":[171],"cues":[172],"instead":[173],"facial":[175],"features":[176],"using":[177],"Grad-CAM":[178],"visualization.":[179],"aims":[182],"accelerate":[184],"research":[185],"towards":[186],"robust":[188],"generalizable":[190],"face":[195],"rapidly":[197],"evolving":[198],"techniques.":[200],"release":[202],"all":[208],"data":[209],"splits":[210],"https://anaxqx.github.io/talkingheadbench.github.io.":[214]},"counts_by_year":[],"updated_date":"2026-05-07T06:04:25.777469","created_date":"2026-05-06T00:00:00"}
