{"id":"https://openalex.org/W4375850648","doi":"https://doi.org/10.1109/icassp49357.2023.10094932","title":"Designing A 3d-Aware Stylenerf Encoder for Face Editing","display_name":"Designing A 3d-Aware Stylenerf Encoder for Face Editing","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4375850648","doi":"https://doi.org/10.1109/icassp49357.2023.10094932"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10094932","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10094932","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100541272","display_name":"Songlin Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Songlin Yang","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence,Beijing,China","Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100757829","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0002-8598-0831"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China"],"affiliations":[{"raw_affiliation_string":"NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","institution_ids":["https://openalex.org/I4210090176"]},{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026744328","display_name":"Bo Peng","orcid":"https://orcid.org/0000-0002-8539-180X"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Peng","raw_affiliation_strings":["NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China"],"affiliations":[{"raw_affiliation_string":"NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","institution_ids":["https://openalex.org/I4210090176"]},{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017743261","display_name":"Jing Dong","orcid":"https://orcid.org/0000-0002-2763-7832"},"institutions":[{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Dong","raw_affiliation_strings":["NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China"],"affiliations":[{"raw_affiliation_string":"NLPR, CASIA,Center for Research on Intelligent Perception and Computing,Beijing,China","institution_ids":["https://openalex.org/I4210090176"]},{"raw_affiliation_string":"Center for Research on Intelligent Perception and Computing, NLPR, CASIA, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100541272"],"corresponding_institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210112150","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.6295,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.68505413,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8233082890510559},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7984377145767212},{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.6040552258491516},{"id":"https://openalex.org/keywords/view-synthesis","display_name":"View synthesis","score":0.5303778052330017},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4972377121448517},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47763505578041077},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4677320420742035},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.459597647190094},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3372610807418823},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.1229265034198761},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07340967655181885}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8233082890510559},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7984377145767212},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.6040552258491516},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.5303778052330017},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4972377121448517},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47763505578041077},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4677320420742035},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.459597647190094},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3372610807418823},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.1229265034198761},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07340967655181885},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C109007969","wikidata":"https://www.wikidata.org/wiki/Q749565","display_name":"Structural basin","level":2,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10094932","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10094932","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2331128040","https://openalex.org/W2962770929","https://openalex.org/W2962785568","https://openalex.org/W2969985801","https://openalex.org/W3014852036","https://openalex.org/W3014859719","https://openalex.org/W3035574324","https://openalex.org/W3039828778","https://openalex.org/W3047371217","https://openalex.org/W3094954720","https://openalex.org/W3109585842","https://openalex.org/W3176179930","https://openalex.org/W3178406257","https://openalex.org/W3180794345","https://openalex.org/W3205325185","https://openalex.org/W4214622647","https://openalex.org/W4285124635","https://openalex.org/W4287817254","https://openalex.org/W4311034013","https://openalex.org/W4312301053","https://openalex.org/W4312453532","https://openalex.org/W4312536384","https://openalex.org/W4320013936","https://openalex.org/W4320458521","https://openalex.org/W6702130928","https://openalex.org/W6771275388","https://openalex.org/W6774631009","https://openalex.org/W6780879210","https://openalex.org/W6784825796","https://openalex.org/W6802668286","https://openalex.org/W6849955655"],"related_works":["https://openalex.org/W2611780867","https://openalex.org/W2731344982","https://openalex.org/W1491099440","https://openalex.org/W4390516098","https://openalex.org/W2073038808","https://openalex.org/W3104631102","https://openalex.org/W2181948922","https://openalex.org/W1983958657","https://openalex.org/W3010999348","https://openalex.org/W1971689240"],"abstract_inverted_index":{"GAN":[0,42,57,72],"inversion":[1,37,43,58,73],"has":[2],"been":[3],"exploited":[4],"in":[5,140],"many":[6],"face":[7,75,91,110,138],"manipulation":[8,139],"tasks,":[9],"but":[10],"2D":[11,25],"GANs":[12,26],"often":[13],"fail":[14],"to":[15,30,46,99,119],"generate":[16,100],"multi-view":[17],"3D":[18,33,49,90,136],"consistent":[19,137],"images.":[20],"The":[21],"encoders":[22],"designed":[23],"for":[24,35,71,149],"are":[27],"not":[28],"able":[29],"provide":[31],"sufficient":[32],"information":[34],"the":[36,48,55,79,121,154,166,170],"and":[38,74,103,127,145],"editing.":[39],"Therefore,":[40],"3D-aware":[41,56,68],"is":[44],"proposed":[45,84],"increase":[47],"editing":[50,76,144],"capability":[51],"of":[52,156,169],"GANs.":[53],"However,":[54],"remains":[59],"under-explored.":[60],"To":[61],"tackle":[62],"this":[63],"problem,":[64],"we":[65,112,134,152],"propose":[66],"a":[67,88,94,115,160],"(3Da)":[69],"encoder":[70,86],"based":[77],"on":[78],"powerful":[80],"StyleNeRF":[81,122],"model.":[82],"Our":[83],"3Da":[85],"combines":[87],"parametric":[89],"model":[92,98],"with":[93,124],"learnable":[95],"detail":[96],"representation":[97],"geometry,":[101],"texture":[102,128,146],"view":[104],"direction":[105],"codes.":[106],"For":[107],"more":[108],"flexible":[109],"manipulation,":[111],"then":[113],"design":[114],"dual-branch":[116],"StyleFlow":[117],"module":[118],"transfer":[120],"codes":[123,158],"disentangled":[125],"geometry":[126],"flows.":[129],"Extensive":[130],"experiments":[131],"demonstrate":[132],"that":[133],"realize":[135],"both":[141],"facial":[142],"attribute":[143],"transfer.":[147],"Furthermore,":[148],"video":[150],"editing,":[151],"make":[153],"sequence":[155],"frame":[157],"share":[159],"common":[161],"canonical":[162],"manifold,":[163],"which":[164],"improves":[165],"temporal":[167],"consistency":[168],"edited":[171],"attributes.":[172]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
