{"id":"https://openalex.org/W7128402582","doi":"https://doi.org/10.48550/arxiv.2602.06122","title":"From Blurry to Believable: Enhancing Low-quality Talking Heads with 3D Generative Priors","display_name":"From Blurry to Believable: Enhancing Low-quality Talking Heads with 3D Generative Priors","publication_year":2026,"publication_date":"2026-02-05","ids":{"openalex":"https://openalex.org/W7128402582","doi":"https://doi.org/10.48550/arxiv.2602.06122"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.06122","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111024343","display_name":"Ding-Jiun Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Huang, Ding-Jiun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125400720","display_name":"Yuanhao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuanhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065481040","display_name":"Shao-Ji Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Shao-Ji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125391100","display_name":"Albert Mosella-Montoro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mosella-Montoro, Albert","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047750700","display_name":"Francisco Vicente Carrasco","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carrasco, Francisco Vicente","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125378005","display_name":"Cheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125379503","display_name":"Fernando De la Torre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De la Torre, Fernando","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111024343"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.6743999719619751,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.6743999719619751,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2856999933719635,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.006399999838322401,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.7245000004768372},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.48350000381469727},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4821999967098236},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.46860000491142273},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.43860000371932983},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3962000012397766},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.3668999969959259},{"id":"https://openalex.org/keywords/computer-facial-animation","display_name":"Computer facial animation","score":0.3646000027656555},{"id":"https://openalex.org/keywords/view-synthesis","display_name":"View synthesis","score":0.34700000286102295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7746000289916992},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.7245000004768372},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6791999936103821},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5758000016212463},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.48350000381469727},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4821999967098236},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.46860000491142273},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.43860000371932983},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3962000012397766},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3668999969959259},{"id":"https://openalex.org/C138591656","wikidata":"https://www.wikidata.org/wiki/Q5157538","display_name":"Computer facial animation","level":4,"score":0.3646000027656555},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.34700000286102295},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3433000147342682},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.34209999442100525},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.34200000762939453},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.3221000134944916},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.31949999928474426},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.31709998846054077},{"id":"https://openalex.org/C109950114","wikidata":"https://www.wikidata.org/wiki/Q4464732","display_name":"3D reconstruction","level":2,"score":0.30329999327659607},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2985999882221222},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C69369342","wikidata":"https://www.wikidata.org/wiki/Q1401416","display_name":"Computer animation","level":3,"score":0.28040000796318054},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.2533999979496002},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2517000138759613},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.06122","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.06122","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.06122","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.06122","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"No poverty","id":"https://metadata.un.org/sdg/1","score":0.41840535402297974}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Creating":[0],"high-fidelity,":[1],"animatable":[2,40],"3D":[3,26,41,57,85,97,104,121],"talking":[4],"heads":[5],"is":[6,128,143],"crucial":[7],"for":[8,37,139],"immersive":[9],"applications,":[10],"yet":[11],"often":[12],"hindered":[13],"by":[14],"the":[15,92,110,114],"prevalence":[16],"of":[17,113,150],"low-quality":[18],"image":[19],"or":[20],"video":[21,72],"sources,":[22],"which":[23,127],"yield":[24],"poor":[25],"reconstructions.":[27],"In":[28],"this":[29],"paper,":[30],"we":[31],"introduce":[32],"SuperHead,":[33],"a":[34,101,119,147],"novel":[35,102],"framework":[36],"enhancing":[38],"low-resolution,":[39],"head":[42,125,135],"avatars.":[43],"The":[44,141],"core":[45],"challenge":[46],"lies":[47],"in":[48,70,191],"synthesizing":[49],"high-quality":[50],"geometry":[51],"and":[52,58,63,73,155,164],"textures,":[53],"while":[54],"ensuring":[55],"both":[56],"temporal":[59],"consistency":[60],"during":[61],"animation":[62],"preserving":[64],"subject":[65],"identity.":[66],"Despite":[67],"recent":[68],"progress":[69],"image,":[71],"3D-based":[74],"super-resolution":[75],"(SR),":[76],"existing":[77],"SR":[78],"techniques":[79],"are":[80],"ill-equipped":[81],"to":[82,117,131,167],"handle":[83],"dynamic":[84,171,185],"inputs.":[86],"To":[87],"address":[88],"this,":[89],"SuperHead":[90,177],"leverages":[91],"rich":[93],"priors":[94],"from":[95,160],"pre-trained":[96],"generative":[98,115],"models":[99],"via":[100],"dynamics-aware":[103],"inversion":[105,142],"scheme.":[106],"This":[107],"process":[108],"optimizes":[109],"latent":[111],"representation":[112],"model":[116,136],"produce":[118],"super-resolved":[120],"Gaussian":[122],"Splatting":[123],"(3DGS)":[124],"model,":[126],"subsequently":[129],"rigged":[130],"an":[132],"underlying":[133],"parametric":[134],"(e.g.,":[137],"FLAME)":[138],"animation.":[140],"jointly":[144],"supervised":[145],"using":[146],"sparse":[148],"collection":[149],"upscaled":[151],"2D":[152],"face":[153],"renderings":[154],"corresponding":[156],"depth":[157],"maps,":[158],"captured":[159],"diverse":[161],"facial":[162,172,182],"expressions":[163],"camera":[165],"viewpoints,":[166],"ensure":[168],"realism":[169],"under":[170,184],"motions.":[173],"Experiments":[174],"demonstrate":[175],"that":[176],"generates":[178],"avatars":[179],"with":[180],"fine-grained":[181],"details":[183],"motions,":[186],"significantly":[187],"outperforming":[188],"baseline":[189],"methods":[190],"visual":[192],"quality.":[193]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-10T00:00:00"}
