{"id":"https://openalex.org/W7160520991","doi":"https://doi.org/10.48550/arxiv.2605.04702","title":"FaithfulFaces: Pose-Faithful Facial Identity Preservation for Text-to-Video Generation","display_name":"FaithfulFaces: Pose-Faithful Facial Identity Preservation for Text-to-Video Generation","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160520991","doi":"https://doi.org/10.48550/arxiv.2605.04702"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04702","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04702","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04702","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135623327","display_name":"Yuanzhi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuanzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135593692","display_name":"Xuhua Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Xuhua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008859889","display_name":"Jiaxiang Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Jiaxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135587114","display_name":"Bing Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Bing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135578354","display_name":"Kai Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Kai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135621437","display_name":"Sen Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Sen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101684085","display_name":"Wenyue Li","orcid":"https://orcid.org/0000-0003-4748-982X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Wenyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135626403","display_name":"Tianxiang Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Tianxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135616001","display_name":"Qinglin Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Qinglin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135551682","display_name":"Zhen Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Zhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9523000121116638,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9523000121116638,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.03720000013709068,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.002199999988079071,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.6782000064849854},{"id":"https://openalex.org/keywords/clarity","display_name":"CLARITY","score":0.512499988079071},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.48249998688697815},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46299999952316284},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.39559999108314514},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3418000042438507},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.3337000012397766}],"concepts":[{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.6782000064849854},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5486999750137329},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.532800018787384},{"id":"https://openalex.org/C2777146004","wikidata":"https://www.wikidata.org/wiki/Q14949826","display_name":"CLARITY","level":2,"score":0.512499988079071},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46299999952316284},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41909998655319214},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.39559999108314514},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.35199999809265137},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3418000042438507},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.3337000012397766},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.3296999931335449},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.2976999878883362},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2741999924182892}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04702","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04702","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04702","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04702","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Identity-preserving":[0],"text-to-video":[1],"generation":[2],"(IPT2V)":[3],"empowers":[4],"users":[5],"to":[6,49,120],"produce":[7],"diverse":[8],"and":[9,67,78,143,150],"imaginative":[10],"videos":[11],"with":[12,94],"consistent":[13],"human":[14],"facial":[15,30,34,44,69,91,103,128],"identity.":[16],"Despite":[17],"recent":[18],"progress,":[19],"existing":[20],"methods":[21],"often":[22],"suffer":[23],"from":[24],"significant":[25],"identity":[26,45,63,141],"distortion":[27],"under":[28],"large":[29],"pose":[31,80,92,129,148],"variations":[32],"or":[33],"occlusions.":[35],"In":[36,113],"this":[37],"paper,":[38],"we":[39,115],"propose":[40],"\\textit{FaithfulFaces},":[41],"a":[42,61,75,79,89,101,117,122],"pose-faithful":[43,102],"preservation":[46],"learning":[47],"framework":[48],"improve":[50],"IPT2V":[51],"in":[52],"complex":[53],"dynamic":[54],"scenes.":[55],"The":[56],"key":[57],"of":[58],"FaithfulFaces":[59,99,135],"is":[60],"pose-shared":[62,76],"aligner":[64],"that":[65,105,134],"refines":[66],"aligns":[68],"poses":[70],"across":[71],"distinct":[72],"views":[73],"via":[74],"dictionary":[77],"variation-identity":[81],"invariance":[82],"constraint.":[83],"By":[84],"mapping":[85],"single-view":[86],"inputs":[87],"into":[88],"global":[90],"representation":[93],"explicit":[95],"Euler":[96],"angle":[97],"embeddings,":[98],"provides":[100],"prior":[104],"guides":[106],"generative":[107],"foundations":[108],"toward":[109],"robust":[110],"identity-preserving":[111],"generation.":[112],"particular,":[114],"develop":[116],"specialized":[118],"pipeline":[119],"curate":[121],"high-quality":[123],"video":[124],"dataset":[125],"featuring":[126],"substantial":[127],"diversity.":[130],"Extensive":[131],"experiments":[132],"demonstrate":[133],"achieves":[136],"state-of-the-art":[137],"performance,":[138],"maintaining":[139],"superior":[140],"consistency":[142],"structural":[144],"clarity":[145],"even":[146],"as":[147],"changes":[149],"occlusions":[151],"occur.":[152]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-08T00:00:00"}
