{"id":"https://openalex.org/W4415428508","doi":"https://doi.org/10.3233/faia251143","title":"D3-Talker: Dual-Branch Decoupled Deformation Fields for Few-Shot 3D Talking Head Synthesis","display_name":"D3-Talker: Dual-Branch Decoupled Deformation Fields for Few-Shot 3D Talking Head Synthesis","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415428508","doi":"https://doi.org/10.3233/faia251143"},"language":null,"primary_location":{"id":"doi:10.3233/faia251143","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251143","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia251143","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026009881","display_name":"Ye Guo","orcid":"https://orcid.org/0000-0002-1813-9815"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Yuhang Guo","raw_affiliation_strings":["School of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032382826","display_name":"Ying Deng","orcid":"https://orcid.org/0000-0003-4643-3525"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Kaijun Deng","raw_affiliation_strings":["School of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032668841","display_name":"Siyang Song","orcid":"https://orcid.org/0000-0001-8325-0133"},"institutions":[{"id":"https://openalex.org/I23923803","display_name":"University of Exeter","ror":"https://ror.org/03yghzc09","country_code":"GB","type":"education","lineage":["https://openalex.org/I23923803"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Siyang Song","raw_affiliation_strings":["HBUG Lab, University of Exeter"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HBUG Lab, University of Exeter","institution_ids":["https://openalex.org/I23923803"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102734730","display_name":"Jindong Xie","orcid":"https://orcid.org/0000-0002-1330-0040"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Jindong Xie","raw_affiliation_strings":["School of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018507572","display_name":"Wenhui Ma","orcid":"https://orcid.org/0000-0001-5283-251X"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Wenhui Ma","raw_affiliation_strings":["School of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019313200","display_name":"Linlin Shen","orcid":"https://orcid.org/0000-0003-1420-0815"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I4210105229","display_name":"City University of Hong Kong, Shenzhen Research Institute","ror":"https://ror.org/00xc0ma20","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210105229"]},{"id":"https://openalex.org/I4210142539","display_name":"Guangdong Institute of Intelligent Manufacturing","ror":"https://ror.org/049jpjz09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210142539"]},{"id":"https://openalex.org/I97750245","display_name":"Software (Spain)","ror":"https://ror.org/02ethns06","country_code":"ES","type":"company","lineage":["https://openalex.org/I4210087817","https://openalex.org/I97750245"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Linlin Shen","raw_affiliation_strings":["Computer Vision Institute, School of Artificial Intelligence, Shenzhen University, Shenzhen, China","Guangdong Provincial Key Laboratory of Intelligent Information Processing","School of Computer Science and Software Engineering, Shenzhen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Institute, School of Artificial Intelligence, Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I4210105229"]},{"raw_affiliation_string":"Guangdong Provincial Key Laboratory of Intelligent Information Processing","institution_ids":["https://openalex.org/I4210142539"]},{"raw_affiliation_string":"School of Computer Science and Software Engineering, Shenzhen University","institution_ids":["https://openalex.org/I180726961","https://openalex.org/I97750245"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.64598619,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.8575999736785889,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.8575999736785889,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.8522999882698059,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10783","display_name":"Additive Manufacturing and 3D Printing Technologies","score":0.8496999740600586,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.6642000079154968},{"id":"https://openalex.org/keywords/head","display_name":"Head (geology)","score":0.4361000061035156},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.35370001196861267},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.3449000120162964},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.3386000096797943},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.3257000148296356},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.30140000581741333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7452999949455261},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.6642000079154968},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6432999968528748},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6226000189781189},{"id":"https://openalex.org/C2780312720","wikidata":"https://www.wikidata.org/wiki/Q5689100","display_name":"Head (geology)","level":2,"score":0.4361000061035156},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.38920000195503235},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.35370001196861267},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3386000096797943},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.3257000148296356},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.30140000581741333},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.28760001063346863},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.28690001368522644},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C77660652","wikidata":"https://www.wikidata.org/wiki/Q150971","display_name":"Computer graphics","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.27810001373291016},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2542000114917755}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia251143","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251143","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia251143","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251143","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"A":[0],"key":[1],"challenge":[2],"in":[3,9,68,173],"3D":[4,99],"talking":[5,15,84],"head":[6,16,85,158],"synthesis":[7],"lies":[8],"the":[10,61,69,121,151],"reliance":[11],"on":[12,74],"a":[13,20,76,92,97,130,146],"long-duration":[14],"video":[17],"to":[18,33,52,59,64,110,138,149],"train":[19],"new":[21],"model":[22],"for":[23],"each":[24],"target":[25,70],"identity":[26],"from":[27,41],"scratch.":[28],"Recent":[29],"methods":[30,172],"have":[31],"attempted":[32],"address":[34],"this":[35],"issue":[36],"by":[37,157],"extracting":[38],"general":[39,124],"features":[40],"audio":[42,48,63,105],"through":[43],"pre-training":[44,137],"models.":[45],"However,":[46],"since":[47],"contains":[49],"information":[50],"irrelevant":[51],"lip":[53,66,81],"motion,":[54],"existing":[55],"approaches":[56],"typically":[57],"struggle":[58],"map":[60],"given":[62],"realistic":[65],"behaviors":[67],"face":[71],"when":[72],"trained":[73],"only":[75],"few":[77],"frames,":[78],"causing":[79],"poor":[80],"synchronization":[82,180],"and":[83,103,106,125,160,177],"image":[86,163],"quality.":[87,164],"This":[88],"paper":[89],"proposes":[90],"D3-Talker,":[91],"novel":[93,131],"approach":[94],"that":[95,168],"constructs":[96],"static":[98],"Gaussian":[100,115],"attribute":[101,116],"field":[102],"employs":[104],"Facial":[107],"Motion":[108],"signals":[109],"independently":[111],"control":[112],"two":[113],"distinct":[114],"deformation":[117],"fields,":[118],"effectively":[119],"decoupling":[120],"predictions":[122],"of":[123],"personalized":[126],"deformations.":[127],"We":[128],"design":[129],"similarity":[132],"contrastive":[133],"loss":[134],"function":[135],"during":[136],"achieve":[139],"more":[140],"thorough":[141],"decoupling.":[142],"Furthermore,":[143],"we":[144],"integrate":[145],"Coarse-to-Fine":[147],"module":[148],"refine":[150],"rendered":[152],"images,":[153],"alleviating":[154],"blurriness":[155],"caused":[156],"movements":[159],"enhancing":[161],"overall":[162],"Extensive":[165],"experiments":[166],"demonstrate":[167],"D3-Talker":[169],"outperforms":[170],"state-of-the-art":[171],"both":[174],"high-fidelity":[175],"rendering":[176],"accurate":[178],"audio-lip":[179],"with":[181],"limited":[182],"training":[183],"data.":[184]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-24T00:00:00"}
