{"id":"https://openalex.org/W4304099305","doi":"https://doi.org/10.1145/3503161.3547758","title":"Towards Open-Ended Text-to-Face Generation, Combination and Manipulation","display_name":"Towards Open-Ended Text-to-Face Generation, Combination and Manipulation","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4304099305","doi":"https://doi.org/10.1145/3503161.3547758"},"language":"en","primary_location":{"id":"doi:10.1145/3503161.3547758","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3547758","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101817133","display_name":"Jun Peng","orcid":"https://orcid.org/0000-0003-0655-1594"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Peng","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114035137","display_name":"Han Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Han Pan","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091531008","display_name":"Yiyi Zhou","orcid":"https://orcid.org/0000-0002-5110-4526"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiyi Zhou","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109506594","display_name":"Jing He","orcid":"https://orcid.org/0000-0001-6867-4122"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing He","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059926864","display_name":"Xiaoshuai Sun","orcid":"https://orcid.org/0000-0003-3912-9306"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoshuai Sun","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101846033","display_name":"Yan Wang","orcid":"https://orcid.org/0000-0003-4309-3166"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan Wang","raw_affiliation_strings":["Pinterest, Seattle, WA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pinterest, Seattle, WA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100716576","display_name":"Yongjian Wu","orcid":"https://orcid.org/0000-0003-2007-6929"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongjian Wu","raw_affiliation_strings":["Tencent Youtu Lab, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent Youtu Lab, Shanghai, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016080094","display_name":"Rongrong Ji","orcid":"https://orcid.org/0000-0001-9163-2932"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongrong Ji","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4129,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.70618301,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5045","last_page":"5054"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8389184474945068},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5286964178085327},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5286498665809631},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.5069242119789124},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.501887321472168},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.48808515071868896},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.48346906900405884},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47920331358909607},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.46783533692359924},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.46580392122268677},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.4462757706642151},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.36381465196609497},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3440559506416321},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.21969828009605408},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17556336522102356}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8389184474945068},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5286964178085327},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5286498665809631},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.5069242119789124},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.501887321472168},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.48808515071868896},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.48346906900405884},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47920331358909607},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.46783533692359924},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.46580392122268677},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.4462757706642151},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.36381465196609497},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3440559506416321},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.21969828009605408},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17556336522102356},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3503161.3547758","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3547758","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1656144382","display_name":null,"funder_award_id":"No.62025603","funder_id":"https://openalex.org/F4320336125","funder_display_name":"National Science Fund for Distinguished Young Scholars"},{"id":"https://openalex.org/G3257909562","display_name":null,"funder_award_id":"No.U1705262, No.62176222, No.62176223, No.62176226, No.62072386, No.62072387, No.62072389, No.62002305, No.61772443, No.61802324 and No.61702136","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4217974285","display_name":null,"funder_award_id":"No.20720200077, No.20720200090 and No.20720200091","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320336125","display_name":"National Science Fund for Distinguished Young Scholars","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1834627138","https://openalex.org/W2079735306","https://openalex.org/W2117539524","https://openalex.org/W2183341477","https://openalex.org/W2962770929","https://openalex.org/W2962785568","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2966792645","https://openalex.org/W2994303421","https://openalex.org/W3034431451","https://openalex.org/W3035097537","https://openalex.org/W3035316078","https://openalex.org/W3035574324","https://openalex.org/W3048372515","https://openalex.org/W3048484056","https://openalex.org/W3092673631","https://openalex.org/W3093025045","https://openalex.org/W3095707326","https://openalex.org/W3103667010","https://openalex.org/W3120992250","https://openalex.org/W3173241699","https://openalex.org/W3174194560","https://openalex.org/W3177221875","https://openalex.org/W3178406257","https://openalex.org/W3191739452","https://openalex.org/W3203312420","https://openalex.org/W3207865986","https://openalex.org/W4214540501","https://openalex.org/W4214622647","https://openalex.org/W4214926101","https://openalex.org/W4224304134","https://openalex.org/W4226055713"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3005996785","https://openalex.org/W3014948380","https://openalex.org/W4386984417","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W2087346071","https://openalex.org/W2967848559"],"abstract_inverted_index":{"Text-to-face":[0],"(T2F)":[1],"generation":[2],"is":[3,61],"an":[4,71,115],"emerging":[5],"research":[6],"hot":[7],"spot":[8],"in":[9,16,33,43,206,221],"multimedia,":[10],"and":[11,45,96,103,149,188,210],"its":[12,218],"main":[13],"challenge":[14],"lies":[15],"the":[17,30,79,91,98,111,145,151,172,196,202,222],"high":[18],"fidelity":[19],"requirement":[20],"of":[21,101,117,174,199],"generated":[22],"portraits.":[23],"Many":[24],"existing":[25,66,203],"works":[26],"resort":[27],"to":[28,142,201],"exploring":[29],"latent":[31,74,147],"space":[32,75],"a":[34,53,84,138],"pre-trained":[35],"generator,":[36],"e.g.,":[37,119],"StyleGAN,":[38],"which":[39,60],"has":[40],"obvious":[41],"shortcomings":[42],"efficiency":[44,173],"generalization":[46],"ability.":[47],"In":[48,134],"this":[49],"paper,":[50],"we":[51,127,136],"propose":[52,137],"generative":[54],"network":[55],"for":[56,161],"open-ended":[57,102],"text-to-face":[58],"generation,":[59],"termed":[62],"OpenFaceGAN.":[63],"Differing":[64],"from":[65],"StyleGAN-based":[67],"methods,":[68],"OpenFaceGAN":[69,158,200],"constructs":[70],"effective":[72],"multi-modal":[73],"that":[76],"directly":[77,159],"converts":[78],"natural":[80],"language":[81],"description":[82],"into":[83],"face.":[85],"This":[86],"mapping":[87],"paradigm":[88],"can":[89],"fit":[90],"real":[92],"data":[93],"distribution":[94],"well":[95],"make":[97],"model":[99],"capable":[100],"even":[104],"zero-shot":[105,223],"T2F":[106,204],"generation.":[107,224],"Our":[108],"method":[109],"improves":[110],"inference":[112],"speed":[113],"by":[114],"order":[116],"magnitude,":[118],"294":[120],"times":[121],"than":[122],"TediGAN.":[123],"Based":[124],"on":[125,181],"OpenFaceGAN,":[126],"further":[128],"explore":[129],"text-guided":[130],"face":[131,175],"manipulation":[132,163],"(editing).":[133],"particular,":[135],"parameterized":[139],"module,":[140],"OpenEditor,":[141],"automatically":[143],"disentangle":[144],"target":[146],"code":[148],"update":[150],"original":[152],"style":[153],"information.":[154],"OpenEditor":[155],"also":[156,215],"makes":[157],"applicable":[160],"most":[162],"instructions":[164],"without":[165],"example-dependent":[166],"searches":[167],"or":[168],"optimizations,":[169],"greatly":[170,216],"improving":[171],"manipulation.":[176],"We":[177],"conduct":[178],"extensive":[179],"experiments":[180],"two":[182],"benchmark":[183],"datasets":[184],"namely":[185],"Multi-Modal":[186],"CelebA-HQ":[187],"Face2Text-v1.0.":[189],"The":[190],"experimental":[191],"results":[192],"not":[193],"only":[194],"show":[195],"superior":[197],"performance":[198],"methods":[205],"both":[207],"image":[208],"quality":[209],"image-text":[211],"matching":[212],"degree":[213],"but":[214],"confirm":[217],"outstanding":[219],"ability":[220],"Codes":[225],"will":[226],"be":[227],"released":[228],"at:":[229],"\\textcolormagenta":[230],"\\urlhttps://github.com/pengjunn/OpenFace":[231]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
