{"id":"https://openalex.org/W7124926458","doi":"https://doi.org/10.1109/tvcg.2026.3655478","title":"Make-Your-Anchor+: Temporal Consistent 2D Avatar Generation via Video Diffusion Prior","display_name":"Make-Your-Anchor+: Temporal Consistent 2D Avatar Generation via Video Diffusion Prior","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7124926458","doi":"https://doi.org/10.1109/tvcg.2026.3655478","pmid":"https://pubmed.ncbi.nlm.nih.gov/41553909"},"language":"en","primary_location":{"id":"doi:10.1109/tvcg.2026.3655478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2026.3655478","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123396053","display_name":"Ziyao Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyao Huang","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-3141-9979","affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121570216","display_name":"Fan Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fan Tang","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3975-2483","affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Juan Cao","orcid":"https://orcid.org/0000-0002-7857-1546"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Juan Cao","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7857-1546","affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123430629","display_name":"Yong Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Zhang","raw_affiliation_strings":["Tencent, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-0066-3448","affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123418766","display_name":"Xiaodong Cun","orcid":null},"institutions":[{"id":"https://openalex.org/I4396570619","display_name":"Great Bay University","ror":"https://ror.org/01hdgge16","country_code":null,"type":"education","lineage":["https://openalex.org/I4396570619"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Cun","raw_affiliation_strings":["Great Bay University, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0003-3607-2236","affiliations":[{"raw_affiliation_string":"Great Bay University, Guangdong, China","institution_ids":["https://openalex.org/I4396570619"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059812401","display_name":"Yihang Bo","orcid":"https://orcid.org/0009-0005-0060-6621"},"institutions":[{"id":"https://openalex.org/I2802536167","display_name":"Beijing Film Academy","ror":"https://ror.org/03y0w9190","country_code":"CN","type":"education","lineage":["https://openalex.org/I2802536167"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yihang Bo","raw_affiliation_strings":["Beijing Film Academy, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Film Academy, Beijing, China","institution_ids":["https://openalex.org/I2802536167"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123417345","display_name":"Jintao Li","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jintao Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123393977","display_name":"Tong-Yee Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tong-Yee Lee","raw_affiliation_strings":["National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":"https://orcid.org/0000-0001-6699-2944","affiliations":[{"raw_affiliation_string":"National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07689854,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"32","issue":"4","first_page":"2883","last_page":"2897"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.6362000107765198,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.6362000107765198,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.3028999865055084,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.006099999882280827,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/torso","display_name":"Torso","score":0.552299976348877},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.49799999594688416},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4943999946117401},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4754999876022339},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.45879998803138733},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4318999946117401},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.4251999855041504},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3910999894142151},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.37880000472068787}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8657000064849854},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7562000155448914},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7282999753952026},{"id":"https://openalex.org/C523889960","wikidata":"https://www.wikidata.org/wiki/Q160695","display_name":"Torso","level":2,"score":0.552299976348877},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.49799999594688416},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4943999946117401},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4754999876022339},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.45879998803138733},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4318999946117401},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.4251999855041504},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.37880000472068787},{"id":"https://openalex.org/C30814859","wikidata":"https://www.wikidata.org/wiki/Q4119603","display_name":"Video denoising","level":5,"score":0.36649999022483826},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3303999900817871},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.3190000057220459},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.3109999895095825},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C2780575108","wikidata":"https://www.wikidata.org/wiki/Q7316652","display_name":"Retargeting","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2815000116825104},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.27549999952316284},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.262800008058548},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.25369998812675476}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tvcg.2026.3655478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2026.3655478","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},{"id":"pmid:41553909","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41553909","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on visualization and computer graphics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8887096489","display_name":null,"funder_award_id":"62572458","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"the":[1,39,77,116,141,159,166,172],"remarkable":[2],"process":[3],"of":[4,32,42,162],"talking-head-based":[5],"avatar-creating":[6],"solutions,":[7],"directly":[8],"generating":[9],"anchor-style":[10,43],"videos":[11,44],"with":[12,45,83,125],"full-body":[13],"motions":[14],"remains":[15],"challenging.":[16],"In":[17],"this":[18],"study,":[19],"we":[20,52,105],"propose":[21],"Make-Your-Anchor+,":[22],"a":[23,28,54,72,129,149],"novel":[24,150],"system":[25],"necessitating":[26],"only":[27],"one-minute":[29],"video":[30,61,111,122,144],"clip":[31],"an":[33],"individual":[34],"for":[35,76,90],"training,":[36],"subsequently":[37],"enabling":[38],"automatic":[40],"generation":[41],"precise":[46],"torso":[47],"and":[48,96,128,175,182],"hand":[49],"movements.":[50],"Specifically,":[51],"finetune":[53],"proposed":[55,138],"structure-guided":[56],"diffusion":[57,78,112,118,123],"model":[58,119],"on":[59,143],"input":[60],"to":[62,86,120,139,157],"render":[63],"3D":[64],"mesh":[65],"conditions":[66],"into":[67],"human":[68,107],"appearances.":[69],"We":[70],"adopt":[71],"two-stage":[73],"training":[74],"strategy":[75],"model,":[79],"effectively":[80],"mapping":[81],"movements":[82],"specific":[84],"appearances":[85],"create":[87],"digital":[88],"avatars":[89],"online":[91],"streamers,":[92],"live":[93],"shopping":[94],"hosts,":[95],"other":[97],"applications.":[98],"To":[99],"produce":[100],"arbitrary":[101],"long":[102],"temporal":[103,134,180],"video,":[104],"extract":[106],"motion":[108],"information":[109],"from":[110],"prior":[113],"by":[114],"adapting":[115],"frame-wise":[117],"pretrained":[121],"weights":[124],"lower":[126],"cost,":[127],"simple":[130],"yet":[131],"effective":[132],"batch-overlapped":[133],"denoising":[135],"module":[136,154],"is":[137,155],"bypass":[140],"constraints":[142],"length":[145],"during":[146],"inference.":[147],"Finally,":[148],"identity-specific":[151],"face":[152],"enhancement":[153],"introduced":[156],"improve":[158],"visual":[160,178],"quality":[161],"facial":[163],"regions":[164],"in":[165,177],"output":[167],"videos.":[168],"Comparative":[169],"experiments":[170],"demonstrate":[171],"system's":[173],"effectiveness":[174],"superiority":[176],"quality,":[179],"coherence,":[181],"identity":[183],"preservation,":[184],"outperforming":[185],"SOTA":[186],"diffusion/non-diffusion":[187],"methods.":[188]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-21T00:00:00"}
