{"id":"https://openalex.org/W7128424260","doi":"https://doi.org/10.1109/jstsp.2026.3662496","title":"StyleAvatar3D: Leveraging Image-Text Diffusion Models for High-Fidelity 3D Avatar Generation","display_name":"StyleAvatar3D: Leveraging Image-Text Diffusion Models for High-Fidelity 3D Avatar Generation","publication_year":2026,"publication_date":"2026-02-09","ids":{"openalex":"https://openalex.org/W7128424260","doi":"https://doi.org/10.1109/jstsp.2026.3662496"},"language":"en","primary_location":{"id":"doi:10.1109/jstsp.2026.3662496","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2026.3662496","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125467866","display_name":"Chi Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I3133055985","display_name":"Westlake University","ror":"https://ror.org/05hfa4n20","country_code":"CN","type":"education","lineage":["https://openalex.org/I3133055985"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chi Zhang","raw_affiliation_strings":["Westlake University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-6344-2824","affiliations":[{"raw_affiliation_string":"Westlake University, Hangzhou, China","institution_ids":["https://openalex.org/I3133055985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125453336","display_name":"Yiwen Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yiwen Chen","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0009-0006-7945-6028","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yijun Fu","orcid":"https://orcid.org/0009-0007-6885-7595"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yijun Fu","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0009-0007-6885-7595","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125468954","display_name":"Wei Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Cheng","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0003-0088-4398","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125469635","display_name":"Zhenglin Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenglin Zhou","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-5886-0906","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Wenjia Jiang","orcid":"https://orcid.org/0009-0006-6067-1334"},"institutions":[{"id":"https://openalex.org/I3133055985","display_name":"Westlake University","ror":"https://ror.org/05hfa4n20","country_code":"CN","type":"education","lineage":["https://openalex.org/I3133055985"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjia Jiang","raw_affiliation_strings":["Westlake University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0006-6067-1334","affiliations":[{"raw_affiliation_string":"Westlake University, Hangzhou, China","institution_ids":["https://openalex.org/I3133055985"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhibin Wang","orcid":"https://orcid.org/0009-0008-0314-2422"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhibin Wang","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0009-0008-0314-2422","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Bin Fu","orcid":"https://orcid.org/0000-0002-5277-8709"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Fu","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-5277-8709","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125452596","display_name":"Tao Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Chen","raw_affiliation_strings":["Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-0779-9818","affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Gang Yu","orcid":"https://orcid.org/0000-0001-5570-2710"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Yu","raw_affiliation_strings":["Tencent PCG, Shenzhen, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0001-5570-2710","affiliations":[{"raw_affiliation_string":"Tencent PCG, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077750111","display_name":"Guosheng Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Guosheng Lin","raw_affiliation_strings":["Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-0329-7458","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5125435387","display_name":"Chenxi Song","orcid":null},"institutions":[{"id":"https://openalex.org/I3133055985","display_name":"Westlake University","ror":"https://ror.org/05hfa4n20","country_code":"CN","type":"education","lineage":["https://openalex.org/I3133055985"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenxi Song","raw_affiliation_strings":["Westlake University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-2542-9204","affiliations":[{"raw_affiliation_string":"Westlake University, Hangzhou, China","institution_ids":["https://openalex.org/I3133055985"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5125467866"],"corresponding_institution_ids":["https://openalex.org/I3133055985"],"apc_list":null,"apc_paid":null,"fwci":55.8898,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.99711014,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"20","issue":"2","first_page":"192","last_page":"201"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8945000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8945000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.023800000548362732,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.02250000089406967,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stylized-fact","display_name":"Stylized fact","score":0.7143999934196472},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.5996000170707703},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.45910000801086426},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4171000123023987},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.40700000524520874},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.3953000009059906},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.3921999931335449},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.383899986743927},{"id":"https://openalex.org/keywords/solid-modeling","display_name":"Solid modeling","score":0.3736000061035156}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8277000188827515},{"id":"https://openalex.org/C38935604","wikidata":"https://www.wikidata.org/wiki/Q4330363","display_name":"Stylized fact","level":2,"score":0.7143999934196472},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.5996000170707703},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5680999755859375},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4797999858856201},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.45910000801086426},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4171000123023987},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.40700000524520874},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3953000009059906},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3921999931335449},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.3736000061035156},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.37220001220703125},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.37130001187324524},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3538999855518341},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33079999685287476},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.32690000534057617},{"id":"https://openalex.org/C2777897806","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3D modeling","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28839999437332153},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.2840000092983246},{"id":"https://openalex.org/C205203396","wikidata":"https://www.wikidata.org/wiki/Q612143","display_name":"Bilinear interpolation","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.26489999890327454},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2563000023365021}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jstsp.2026.3662496","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2026.3662496","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/212182","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/212182","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.571553647518158,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G5961903033","display_name":null,"funder_award_id":"6250070674","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"recent":[1],"advancements":[2],"in":[3,11,84,159],"image-text":[4,46,75],"diffusion":[5,47,76,130],"models":[6,48,77,97],"have":[7],"stimulated":[8],"research":[9],"interest":[10],"large-scale":[12],"3D":[13,22,41,58,96],"generative":[14],"models.":[15],"Nevertheless,":[16],"the":[17,66,100,133,140,167],"limited":[18],"availability":[19],"of":[20,69,82,102,110,136,142,161,166],"diverse":[21],"resources":[23],"presents":[24],"significant":[25],"challenges":[26],"to":[27,78,98,138],"learning.":[28],"In":[29],"this":[30],"paper,":[31],"we":[32,90,113,126],"present":[33],"a":[34,53,119,128],"novel":[35],"method":[36,64],"for":[37,49,61,122],"generating":[38],"high-quality,":[39],"stylized":[40,111],"avatars":[42,83,143],"that":[43],"utilizes":[44],"pre-trained":[45],"data":[50,88],"generation":[51,59,101,141],"and":[52,71,117,164],"Generative":[54],"Adversarial":[55],"Network":[56],"(GAN)-based":[57],"network":[60],"training.":[62,124],"Our":[63,150],"leverages":[65],"comprehensive":[67],"priors":[68],"appearance":[70],"geometry":[72],"offered":[73],"by":[74],"generate":[79],"multi-view":[80,103],"images":[81],"various":[85],"styles.":[86],"During":[87],"generation,":[89],"employ":[91],"poses":[92],"extracted":[93],"from":[94],"existing":[95],"guide":[99],"images.":[104],"To":[105],"handle":[106],"inaccurate":[107],"pose":[108],"annotations":[109],"images,":[112],"investigate":[114],"view-specific":[115],"prompts":[116],"develop":[118,127],"coarse-to-fine":[120],"discriminator":[121],"GAN":[123],"Additionally,":[125],"latent":[129],"model":[131],"within":[132],"style":[134],"space":[135],"StyleGAN":[137],"enable":[139],"based":[144],"on":[145],"image":[146],"or":[147],"text":[148],"inputs.":[149],"approach":[151],"demonstrates":[152],"superior":[153],"performance":[154],"over":[155],"current":[156],"state-of-the-art":[157],"methods":[158],"terms":[160],"visual":[162],"quality":[163],"diversity":[165],"produced":[168],"avatars.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2026-02-10T00:00:00"}
