{"id":"https://openalex.org/W4283705858","doi":"https://doi.org/10.1109/tpami.2022.3186752","title":"Label-Guided Generative Adversarial Network for Realistic Image Synthesis","display_name":"Label-Guided Generative Adversarial Network for Realistic Image Synthesis","publication_year":2022,"publication_date":"2022-06-28","ids":{"openalex":"https://openalex.org/W4283705858","doi":"https://doi.org/10.1109/tpami.2022.3186752","pmid":"https://pubmed.ncbi.nlm.nih.gov/35763471"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3186752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3186752","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087225139","display_name":"Junchen Zhu","orcid":"https://orcid.org/0000-0002-3872-6689"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junchen Zhu","raw_affiliation_strings":["Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-3872-6689","affiliations":[{"raw_affiliation_string":"Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066645546","display_name":"Lianli Gao","orcid":"https://orcid.org/0000-0002-2522-6394"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianli Gao","raw_affiliation_strings":["Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-2522-6394","affiliations":[{"raw_affiliation_string":"Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036987388","display_name":"Jingkuan Song","orcid":"https://orcid.org/0000-0002-2549-8322"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingkuan Song","raw_affiliation_strings":["Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-2549-8322","affiliations":[{"raw_affiliation_string":"Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017943466","display_name":"Yuan-Fang Li","orcid":"https://orcid.org/0000-0003-4651-2821"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yuan-Fang Li","raw_affiliation_strings":["Faculty of Information Technology, Monash University, Clayton, VIC, Australia"],"raw_orcid":"https://orcid.org/0000-0003-4651-2821","affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Monash University, Clayton, VIC, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063285882","display_name":"Feng Zheng","orcid":"https://orcid.org/0000-0002-1701-9141"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]},{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU","CN"],"is_corresponding":false,"raw_author_name":"Feng Zheng","raw_affiliation_strings":["Faculty of Information Technology, Monash University, Clayton, VIC, Australia","Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-1701-9141","affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Monash University, Clayton, VIC, Australia","institution_ids":["https://openalex.org/I56590836"]},{"raw_affiliation_string":"Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106943753","display_name":"Xuelong Li","orcid":"https://orcid.org/0000-0003-2924-946X"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]},{"id":"https://openalex.org/I890469752","display_name":"Ministry of Industry and Information Technology","ror":"https://ror.org/0385nmy68","country_code":"CN","type":"government","lineage":["https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuelong Li","raw_affiliation_strings":["School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x0027;an, China","an, P. R. China","Key Laboratory of Intelligent Interaction and Applications (Northwestern Polytechnical University), Ministry of Industry and Information Technology, Xi&#x2019"],"raw_orcid":"https://orcid.org/0000-0003-2924-946X","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, OPtics and ElectroNics (iOPEN), Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"an, P. R. China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Intelligent Interaction and Applications (Northwestern Polytechnical University), Ministry of Industry and Information Technology, Xi&#x2019","institution_ids":["https://openalex.org/I17145004","https://openalex.org/I890469752"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052993469","display_name":"Heng Tao Shen","orcid":"https://orcid.org/0000-0002-2999-2088"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Tao Shen","raw_affiliation_strings":["Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-2999-2088","affiliations":[{"raw_affiliation_string":"Future Media Center and School of Computer Science and Engineering, The University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5087225139"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":2.2449,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.8929263,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"45","issue":"3","first_page":"3311","last_page":"3328"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8090975284576416},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7241337895393372},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.7176090478897095},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5455282926559448},{"id":"https://openalex.org/keywords/image-translation","display_name":"Image translation","score":0.5257276296615601},{"id":"https://openalex.org/keywords/generative-adversarial-network","display_name":"Generative adversarial network","score":0.5183109045028687},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5085495710372925},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.484954833984375},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.44985684752464294},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35293757915496826},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.2746349573135376}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8090975284576416},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7241337895393372},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.7176090478897095},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5455282926559448},{"id":"https://openalex.org/C2779757391","wikidata":"https://www.wikidata.org/wiki/Q6002292","display_name":"Image translation","level":3,"score":0.5257276296615601},{"id":"https://openalex.org/C2988773926","wikidata":"https://www.wikidata.org/wiki/Q25104379","display_name":"Generative adversarial network","level":3,"score":0.5183109045028687},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5085495710372925},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.484954833984375},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.44985684752464294},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35293757915496826},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.2746349573135376},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2022.3186752","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3186752","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:35763471","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35763471","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G2546663186","display_name":null,"funder_award_id":"62020106008","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4820425477","display_name":null,"funder_award_id":"61871470","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6864684409","display_name":null,"funder_award_id":"62122018","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7314976618","display_name":null,"funder_award_id":"61872064","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8027008232","display_name":null,"funder_award_id":"61772116","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W189587150","https://openalex.org/W1522301498","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2108598243","https://openalex.org/W2125389028","https://openalex.org/W2133665775","https://openalex.org/W2183341477","https://openalex.org/W2412782625","https://openalex.org/W2475287302","https://openalex.org/W2535388113","https://openalex.org/W2561196672","https://openalex.org/W2603777577","https://openalex.org/W2737258237","https://openalex.org/W2799062770","https://openalex.org/W2808062989","https://openalex.org/W2883376126","https://openalex.org/W2884466206","https://openalex.org/W2884822772","https://openalex.org/W2890404842","https://openalex.org/W2903838325","https://openalex.org/W2910065734","https://openalex.org/W2950689937","https://openalex.org/W2952773607","https://openalex.org/W2962770929","https://openalex.org/W2962793481","https://openalex.org/W2962850830","https://openalex.org/W2962974533","https://openalex.org/W2963073614","https://openalex.org/W2963163163","https://openalex.org/W2963444790","https://openalex.org/W2963470893","https://openalex.org/W2963522749","https://openalex.org/W2963561004","https://openalex.org/W2963767194","https://openalex.org/W2963800363","https://openalex.org/W2963890275","https://openalex.org/W2964217532","https://openalex.org/W2969676068","https://openalex.org/W2983248633","https://openalex.org/W2983484869","https://openalex.org/W3035083401","https://openalex.org/W3035316078","https://openalex.org/W3035574324","https://openalex.org/W3093190933","https://openalex.org/W3115000224","https://openalex.org/W4246193833","https://openalex.org/W4300479382","https://openalex.org/W6621378261","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6678815747","https://openalex.org/W6730095352","https://openalex.org/W6734074887","https://openalex.org/W6745560452","https://openalex.org/W6752378368","https://openalex.org/W6755102824","https://openalex.org/W6755312952","https://openalex.org/W6757842588","https://openalex.org/W6758276651","https://openalex.org/W6765779288","https://openalex.org/W6767457696","https://openalex.org/W6779841522"],"related_works":["https://openalex.org/W2904616728","https://openalex.org/W3119479239","https://openalex.org/W4388937044","https://openalex.org/W2903477224","https://openalex.org/W3198510459","https://openalex.org/W4200417262","https://openalex.org/W3005996785","https://openalex.org/W4282977492","https://openalex.org/W2914450692","https://openalex.org/W3178813832"],"abstract_inverted_index":{"Generating":[0],"photo-realistic":[1],"images":[2],"from":[3,45,54],"labels":[4,7,30,67],"(e.g.,":[5],"semantic":[6,104],"or":[8],"sketch":[9],"labels)":[10],"is":[11,165],"much":[12],"more":[13],"challenging":[14],"than":[15],"the":[16,24,55,63,66,79,99,102,109,121,133,153,178],"general":[17,38],"image-to-image":[18],"translation":[19],"task,":[20],"mainly":[21],"due":[22],"to":[23,41,50,60,77,119,149],"large":[25,94],"differences":[26],"between":[27,65],"extremely":[28],"sparse":[29],"and":[31,57,68,89,160,186,205],"detail":[32],"rich":[33],"images.":[34,69],"We":[35,173],"propose":[36,72,113],"a":[37,73,161],"framework":[39],"Lab2Pix":[40,176],"tackle":[42],"this":[43],"issue":[44],"two":[46],"aspects:":[47],"1)":[48],"how":[49,59],"extract":[51],"useful":[52],"information":[53,126],"input;":[56],"2)":[58],"efficiently":[61,107],"bridge":[62],"gap":[64],"Specifically,":[70],"we":[71,111],"Double-Guided":[74],"Normalization":[75],"(DG-Norm)":[76],"use":[78,90],"input":[80],"label":[81],"for":[82,97,168,177],"semantically":[83],"guiding":[84],"activations":[85,100],"in":[86,136,182,207],"normalization":[87],"layers,":[88],"global":[91],"features":[92],"with":[93,143],"receptive":[95],"fields":[96],"differentiating":[98],"within":[101],"same":[103],"region.":[105],"To":[106],"generate":[108],"images,":[110],"further":[112,166],"Label":[114],"Guided":[115],"Spatial":[116],"Co-Attention":[117],"(LSCA)":[118],"encourage":[120],"learning":[122],"of":[123,180],"incremental":[124],"visual":[125],"using":[127],"limited":[128],"model":[129],"parameters":[130],"while":[131],"storing":[132],"well-synthesized":[134],"part":[135],"lower-level":[137],"features.":[138],"Accordingly,":[139],"Hierarchical":[140],"Perceptual":[141],"Discriminators":[142],"Foreground":[144],"Enhancement":[145],"Masks":[146],"are":[147],"proposed":[148],"toughly":[150],"work":[151],"against":[152],"generator":[154],"thus":[155],"encouraging":[156],"realistic":[157],"image":[158,171],"generation":[159],"sharp":[162,170],"enhancement":[163],"loss":[164],"introduced":[167],"high-quality":[169],"generation.":[172],"instantiate":[174],"our":[175,198],"task":[179],"label-to-image":[181],"both":[183,208],"unpaired":[184],"(Lab2Pix-V1)":[185],"paired":[187],"settings":[188],"(Lab2Pix-V2).":[189],"Extensive":[190],"experiments":[191],"conducted":[192],"on":[193],"various":[194],"datasets":[195],"demonstrate":[196],"that":[197],"method":[199],"significantly":[200],"outperforms":[201],"state-of-the-art":[202],"methods":[203],"quantitatively":[204],"qualitatively":[206],"settings.":[209]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
