{"id":"https://openalex.org/W4388469765","doi":"https://doi.org/10.1109/tcsvt.2023.3330920","title":"FaceCLIP: Facial Image-to-Video Translation via a Brief Text Description","display_name":"FaceCLIP: Facial Image-to-Video Translation via a Brief Text Description","publication_year":2023,"publication_date":"2023-11-07","ids":{"openalex":"https://openalex.org/W4388469765","doi":"https://doi.org/10.1109/tcsvt.2023.3330920"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3330920","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3330920","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100537605","display_name":"Jiayi Guo","orcid":"https://orcid.org/0009-0005-7004-939X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayi Guo","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093218085","display_name":"Hayk Manukyan","orcid":"https://orcid.org/0009-0004-4848-1656"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hayk Manukyan","raw_affiliation_strings":["PicsArt AI Research (PAIR), Eugene, Armenia"],"affiliations":[{"raw_affiliation_string":"PicsArt AI Research (PAIR), Eugene, Armenia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101678003","display_name":"Chenyu Yang","orcid":"https://orcid.org/0000-0001-9997-4929"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenyu Yang","raw_affiliation_strings":["Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute for Interdisciplinary Information Sciences, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052308386","display_name":"Chaofei Wang","orcid":"https://orcid.org/0000-0002-3678-691X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaofei Wang","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006954388","display_name":"Levon Khachatryan","orcid":"https://orcid.org/0000-0002-5840-760X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levon Khachatryan","raw_affiliation_strings":["PicsArt AI Research (PAIR), Eugene, Armenia"],"affiliations":[{"raw_affiliation_string":"PicsArt AI Research (PAIR), Eugene, Armenia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036843155","display_name":"Shant Navasardyan","orcid":"https://orcid.org/0000-0002-1999-9999"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shant Navasardyan","raw_affiliation_strings":["PicsArt AI Research (PAIR), Eugene, Armenia"],"affiliations":[{"raw_affiliation_string":"PicsArt AI Research (PAIR), Eugene, Armenia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101868179","display_name":"Shiji Song","orcid":"https://orcid.org/0000-0003-0858-1770"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiji Song","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002072267","display_name":"Humphrey Shi","orcid":"https://orcid.org/0000-0002-2922-5663"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]},{"id":"https://openalex.org/I181233156","display_name":"University of Oregon","ror":"https://ror.org/0293rh119","country_code":"US","type":"education","lineage":["https://openalex.org/I181233156"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Humphrey Shi","raw_affiliation_strings":["PicsArt AI Research (PAIR), Eugene, Armenia","University of Oregon, the University of Illinois at Urbana-Champaign, USA"],"affiliations":[{"raw_affiliation_string":"PicsArt AI Research (PAIR), Eugene, Armenia","institution_ids":[]},{"raw_affiliation_string":"University of Oregon, the University of Illinois at Urbana-Champaign, USA","institution_ids":["https://openalex.org/I157725225","https://openalex.org/I181233156"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013240918","display_name":"Gao Huang","orcid":"https://orcid.org/0000-0002-7251-0988"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gao Huang","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5100537605"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.1948,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.81632387,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"34","issue":"6","first_page":"4270","last_page":"4284"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.855186939239502},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7247325778007507},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.6163685917854309},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.5271294116973877},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.504768967628479},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4871046543121338},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.47835487127304077},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.4758194088935852},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.43852055072784424},{"id":"https://openalex.org/keywords/facial-expression","display_name":"Facial expression","score":0.42969274520874023},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36785823106765747},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3585846722126007},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3550637364387512},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.3500880300998688},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33084818720817566},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.32638823986053467}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.855186939239502},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7247325778007507},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.6163685917854309},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.5271294116973877},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.504768967628479},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4871046543121338},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.47835487127304077},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.4758194088935852},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.43852055072784424},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.42969274520874023},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36785823106765747},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3585846722126007},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3550637364387512},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3500880300998688},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33084818720817566},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.32638823986053467},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3330920","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3330920","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7410564107","display_name":null,"funder_award_id":"62276150","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8215096727","display_name":null,"funder_award_id":"2021ZD0140407","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G8753403390","display_name":null,"funder_award_id":"62022048","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F3230804744","display_name":"Guoqiang Institute, Tsinghua University","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":122,"referenced_works":["https://openalex.org/W1588539311","https://openalex.org/W2074231493","https://openalex.org/W2115252128","https://openalex.org/W2301937176","https://openalex.org/W2431101926","https://openalex.org/W2475295588","https://openalex.org/W2754447548","https://openalex.org/W2806833697","https://openalex.org/W2883127586","https://openalex.org/W2883183894","https://openalex.org/W2884460600","https://openalex.org/W2890581551","https://openalex.org/W2897039210","https://openalex.org/W2902266071","https://openalex.org/W2944294033","https://openalex.org/W2960274051","https://openalex.org/W2962770929","https://openalex.org/W2962793481","https://openalex.org/W2963163163","https://openalex.org/W2963168844","https://openalex.org/W2963290645","https://openalex.org/W2963408477","https://openalex.org/W2963516695","https://openalex.org/W2963626105","https://openalex.org/W2963917969","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2964313012","https://openalex.org/W2964559396","https://openalex.org/W2965289598","https://openalex.org/W2965503873","https://openalex.org/W2966421984","https://openalex.org/W2969985801","https://openalex.org/W2971634123","https://openalex.org/W2979894294","https://openalex.org/W2981033063","https://openalex.org/W2981860503","https://openalex.org/W2990375436","https://openalex.org/W2990452356","https://openalex.org/W3016155278","https://openalex.org/W3018564516","https://openalex.org/W3023885634","https://openalex.org/W3034371424","https://openalex.org/W3034463304","https://openalex.org/W3035316078","https://openalex.org/W3035574324","https://openalex.org/W3035575271","https://openalex.org/W3035592938","https://openalex.org/W3053644769","https://openalex.org/W3091653824","https://openalex.org/W3092775865","https://openalex.org/W3095289378","https://openalex.org/W3118580076","https://openalex.org/W3120742898","https://openalex.org/W3127393268","https://openalex.org/W3155375169","https://openalex.org/W3165405144","https://openalex.org/W3166255651","https://openalex.org/W3174807077","https://openalex.org/W3175035459","https://openalex.org/W3176032345","https://openalex.org/W3176913662","https://openalex.org/W3178284600","https://openalex.org/W3178406257","https://openalex.org/W3180770160","https://openalex.org/W3194230325","https://openalex.org/W3201739204","https://openalex.org/W3204680331","https://openalex.org/W3205688125","https://openalex.org/W3215495615","https://openalex.org/W4214626920","https://openalex.org/W4214926101","https://openalex.org/W4220834633","https://openalex.org/W4221143397","https://openalex.org/W4224035735","https://openalex.org/W4225101445","https://openalex.org/W4240592325","https://openalex.org/W4286611278","https://openalex.org/W4294306266","https://openalex.org/W4294541506","https://openalex.org/W4312283676","https://openalex.org/W4312301053","https://openalex.org/W4312740349","https://openalex.org/W4312828807","https://openalex.org/W4312913021","https://openalex.org/W4312933868","https://openalex.org/W4313145975","https://openalex.org/W4323891935","https://openalex.org/W4366308854","https://openalex.org/W4385245566","https://openalex.org/W4386071587","https://openalex.org/W4386074714","https://openalex.org/W4386076323","https://openalex.org/W4386373192","https://openalex.org/W6628877408","https://openalex.org/W6634221342","https://openalex.org/W6677618333","https://openalex.org/W6691096134","https://openalex.org/W6712884540","https://openalex.org/W6713645886","https://openalex.org/W6738465933","https://openalex.org/W6745829810","https://openalex.org/W6753914649","https://openalex.org/W6755102824","https://openalex.org/W6755298837","https://openalex.org/W6766759079","https://openalex.org/W6766978945","https://openalex.org/W6767264202","https://openalex.org/W6769148693","https://openalex.org/W6779093361","https://openalex.org/W6779823529","https://openalex.org/W6783713337","https://openalex.org/W6790019176","https://openalex.org/W6790978476","https://openalex.org/W6791353385","https://openalex.org/W6795288823","https://openalex.org/W6809396591","https://openalex.org/W6809885388","https://openalex.org/W6810241581","https://openalex.org/W6838785959","https://openalex.org/W6844305113","https://openalex.org/W6853666625"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4394785709","https://openalex.org/W4309969736","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W2770818364","https://openalex.org/W2953501176","https://openalex.org/W2965095304","https://openalex.org/W2470043383"],"abstract_inverted_index":{"The":[0],"existing":[1],"image-to-video":[2],"translation":[3,123],"methods":[4],"generally":[5],"follow":[6],"a":[7,17,35,49,59,127,139,154],"frame-by-frame":[8],"generative":[9,171],"paradigm,":[10],"while":[11],"extracting":[12],"the":[13,26,64,121,132,145,149,164,168,183,211,222,236],"temporal":[14,133],"information":[15,134],"from":[16],"reference":[18],"video":[19,62,76,86,128,146,170,194],"or":[20],"an":[21,46,74,111,158],"audio":[22],"stream.":[23],"Inspired":[24],"by":[25],"recent":[27],"success":[28],"in":[29,226],"text-guided":[30,169],"image":[31,47,65],"generation,":[32],"we":[33,71,107],"explore":[34],"more":[36],"challenging":[37],"but":[38],"promising":[39],"task,":[40],"Text-guided":[41],"Image-to-Video":[42],"(TI2V)":[43],"translation.":[44],"Given":[45],"and":[48,66,92,109,138,148,157,208,218,232],"brief":[50],"text":[51,150],"description":[52],"as":[53],"input,":[54],"TI2V":[55,104,122],"aims":[56],"to":[57,79,118,130,143,162,166,179,188,241],"generate":[58,80,242],"facial":[60,85,180,189],"expression":[61,90],"following":[63],"text.":[67],"To":[68],"this":[69],"end,":[70],"first":[72],"propose":[73],"automatic":[75],"captioning":[77],"pipeline":[78],"dense":[81,96],"textual":[82,97],"descriptions":[83,98],"for":[84,103],"datasets,":[87],"using":[88,213],"both":[89,229],"labels":[91],"action":[93],"units.":[94],"These":[95],"provide":[99],"precise":[100],"semantic":[101],"guidance":[102],"learning.":[105],"Then":[106],"design":[108,153],"train":[110,163],"efficient":[112],"framework,":[113],"FaceCLIP,":[114],"on":[115,245],"these":[116],"datasets":[117],"deal":[119],"with":[120,203],"task.":[124],"FaceCLIP":[125,202,225,240],"adopts":[126],"autoencoder":[129,165],"model":[131,142],"of":[135,224,228,239],"training":[136,198],"videos,":[137],"pretrained":[140],"CLIP":[141],"embed":[144],"frames":[147],"description.":[151],"We":[152,200],"reconstruction":[155,184],"loss":[156,161,185],"embedding":[159],"alignment":[160],"obtain":[167],"ability.":[172],"Recognizing":[173],"that":[174],"expressions":[175],"are":[176],"closely":[177],"tied":[178],"landmark":[181],"motions,":[182],"is":[186],"applied":[187],"landmarks":[190],"rather":[191],"than":[192],"each":[193],"frame,":[195],"significantly":[196],"enhancing":[197],"efficiency.":[199],"compare":[201],"several":[204],"potential":[205],"baseline":[206],"methods,":[207],"extensively":[209],"evaluate":[210],"performance":[212],"multiple":[214],"metrics.":[215],"Both":[216],"qualitative":[217],"quantitative":[219],"results":[220],"validate":[221],"superiority":[223],"terms":[227],"visual":[230],"quality":[231],"expression-text":[233],"consistency.":[234],"Moreover,":[235],"unique":[237],"ability":[238],"videos":[243],"based":[244],"abstract":[246],"texts":[247],"demonstrates":[248],"its":[249],"stronger":[250],"generalization":[251],"capability.":[252]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":4}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
