{"id":"https://openalex.org/W4413018187","doi":"https://doi.org/10.1109/fg61629.2025.11099168","title":"Dynamic Visual Speaking Patterns: You Are the Way You Speak","display_name":"Dynamic Visual Speaking Patterns: You Are the Way You Speak","publication_year":2025,"publication_date":"2025-05-26","ids":{"openalex":"https://openalex.org/W4413018187","doi":"https://doi.org/10.1109/fg61629.2025.11099168"},"language":"en","primary_location":{"id":"doi:10.1109/fg61629.2025.11099168","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fg61629.2025.11099168","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 19th International Conference on Automatic Face and Gesture Recognition (FG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072269410","display_name":"Sihui Luo","orcid":"https://orcid.org/0000-0003-2822-0446"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Songtao Luo","raw_affiliation_strings":["Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China","institution_ids":["https://openalex.org/I4210090176"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020086523","display_name":"Shuang Yang","orcid":"https://orcid.org/0000-0003-1133-384X"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuang Yang","raw_affiliation_strings":["Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China","institution_ids":["https://openalex.org/I4210090176"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050297728","display_name":"Shiguang Shan","orcid":"https://orcid.org/0000-0002-8348-392X"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiguang Shan","raw_affiliation_strings":["Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China","institution_ids":["https://openalex.org/I4210090176"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111681970","display_name":"Xilin Chen","orcid":"https://orcid.org/0009-0006-0485-0127"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xilin Chen","raw_affiliation_strings":["Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology CAS,Key Laboratory of Intelligent Information Processing of Chinese Academy of Sciences (CAS),Beijing,China","institution_ids":["https://openalex.org/I4210090176"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072269410"],"corresponding_institution_ids":["https://openalex.org/I4210090176"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11308058,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.09399999678134918,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.09399999678134918,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7064001560211182},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3511192202568054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32489293813705444}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7064001560211182},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3511192202568054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32489293813705444}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/fg61629.2025.11099168","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fg61629.2025.11099168","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 19th International Conference on Automatic Face and Gesture Recognition (FG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W2096733369","https://openalex.org/W2194775991","https://openalex.org/W2301937176","https://openalex.org/W2366739890","https://openalex.org/W2520774990","https://openalex.org/W2551624499","https://openalex.org/W2808631503","https://openalex.org/W2884460600","https://openalex.org/W2891145043","https://openalex.org/W2902299888","https://openalex.org/W2914447220","https://openalex.org/W2949007385","https://openalex.org/W2963767194","https://openalex.org/W2963767627","https://openalex.org/W2969985801","https://openalex.org/W2981767644","https://openalex.org/W2982058372","https://openalex.org/W2984700035","https://openalex.org/W3007419529","https://openalex.org/W3015734344","https://openalex.org/W3034241236","https://openalex.org/W3034521057","https://openalex.org/W3034552680","https://openalex.org/W3034713808","https://openalex.org/W3035067471","https://openalex.org/W3035364348","https://openalex.org/W3036235590","https://openalex.org/W3092709185","https://openalex.org/W3093010840","https://openalex.org/W3093077034","https://openalex.org/W3097741049","https://openalex.org/W3109224353","https://openalex.org/W3109225549","https://openalex.org/W3130626676","https://openalex.org/W3143332912","https://openalex.org/W3163527109","https://openalex.org/W3175342695","https://openalex.org/W3186090335","https://openalex.org/W3214738836","https://openalex.org/W4214691743","https://openalex.org/W4220739185","https://openalex.org/W4221145616","https://openalex.org/W4229507706","https://openalex.org/W4281727803","https://openalex.org/W4281779270","https://openalex.org/W4312992915","https://openalex.org/W4321231565","https://openalex.org/W4366308854","https://openalex.org/W4375868968","https://openalex.org/W4386066256","https://openalex.org/W4386072021","https://openalex.org/W4386075501","https://openalex.org/W4387967909","https://openalex.org/W4388081272","https://openalex.org/W4402130146","https://openalex.org/W4407837644","https://openalex.org/W6637618735","https://openalex.org/W6639480849","https://openalex.org/W6725923168","https://openalex.org/W6736057607","https://openalex.org/W6748181857","https://openalex.org/W6762480454","https://openalex.org/W6797657831"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0,32],"this":[1],"paper,":[2],"we":[3,41,90],"present":[4],"a":[5,169,197,231],"new":[6,232],"perspective":[7],"on":[8,28,51,179,186,196],"analyzing":[9],"the":[10,68,73,82,110,133,143,148,152,176,225,259],"unique":[11],"visual":[12,38,227],"patterns":[13,118,127,228],"specific":[14],"to":[15,70,96,124,151,174,184,230],"each":[16],"speaker":[17,23,59,75,98,199,212,256,265],"in":[18,77,84,211,220,235,243,267],"talking":[19,236],"head":[20,237],"videos.":[21,79,272],"Traditional":[22],"recognition":[24,60,99,200,213,266],"methods":[25],"primarily":[26],"rely":[27],"static":[29,112,160,180,255],"facial":[30,113],"appearance.":[31],"contrast,":[33],"our":[34,54,192,206,250],"method":[35,207],"emphasizes":[36],"dynamic":[37,52,117,126,162,187,226],"patterns,":[39,53],"which":[40],"denote":[42],"as":[43],"Dynamic":[44],"Visual":[45],"speaking":[46],"Patterns":[47],"(DVPs).":[48],"By":[49],"concentrating":[50],"approach":[55],"not":[56,208],"only":[57,209],"facilitates":[58],"but":[61,115,215],"also":[62,216],"inherently":[63,217],"resists":[64,218],"fake":[65],"samples,":[66],"with":[67],"potential":[69,260],"accurately":[71],"identify":[72],"original":[74,111],"even":[76],"manipulated":[78,271],"To":[80],"guide":[81],"model":[83,121],"learning":[85],"DVPs":[86,252,262],"beyond":[87],"superficial":[88],"appearance,":[89],"introduce":[91,105],"three":[92],"seamlessly":[93],"integrable":[94],"improvements":[95],"existing":[97],"works:":[100],"(1)":[101],"Input":[102],"level:":[103,140],"We":[104,141,167,189],"negative":[106],"samples":[107],"that":[108,205],"retain":[109],"features":[114],"distort":[116],"intentionally.":[119],"The":[120,247],"then":[122],"learns":[123],"distinguish":[125],"across":[128],"different":[129],"speakers":[130],"effectively":[131],"With":[132],"strategy":[134],"of":[135,249,261],"contrastive":[136],"learning.":[137],"(2)":[138],"Feature":[139],"convert":[142],"input":[144],"video":[145,222,238],"frames":[146],"from":[147],"spatio-temporal":[149],"domain":[150],"frequencytemporal":[153],"domain,":[154],"facilitating":[155],"an":[156],"easy":[157],"distinction":[158],"between":[159],"and":[161,270],"patterns.":[163,188],"(3)":[164],"Learning":[165],"strategy:":[166],"incorporate":[168],"Gradient":[170],"Reversal":[171],"Layer":[172],"(GRL)":[173],"mitigate":[175],"model\u2019s":[177],"reliance":[178],"features,":[181],"forcing":[182],"it":[183],"focus":[185],"finally":[190],"validate":[191],"work":[193],"comprehensively":[194],"based":[195],"simple":[198],"framework.":[201],"Experimental":[202],"results":[203],"show":[204],"excels":[210],"tasks":[214],"manipulation":[219],"forged":[221,244],"samples.":[223],"Moreover,":[224],"lead":[229],"challenge":[233],"task":[234],"analysis:":[239],"Identifying":[240],"Original":[241],"Speaker":[242],"videos":[245],"(IOS).":[246],"advantages":[248],"proposed":[251],"over":[253],"traditional":[254],"representations":[257],"highlight":[258],"for":[263],"robust":[264],"both":[268],"real":[269]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
