{"id":"https://openalex.org/W3096458759","doi":"https://doi.org/10.1109/ijcnn52387.2021.9533527","title":"DTGAN: Dual Attention Generative Adversarial Networks for Text-to-Image Generation","display_name":"DTGAN: Dual Attention Generative Adversarial Networks for Text-to-Image Generation","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3096458759","doi":"https://doi.org/10.1109/ijcnn52387.2021.9533527","mag":"3096458759"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9533527","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9533527","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.rug.nl/en/publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100605424","display_name":"Zhenxing Zhang","orcid":"https://orcid.org/0000-0003-2887-9873"},"institutions":[{"id":"https://openalex.org/I169381384","display_name":"University of Groningen","ror":"https://ror.org/012p63287","country_code":"NL","type":"education","lineage":["https://openalex.org/I169381384"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Zhenxing Zhang","raw_affiliation_strings":["Bernoulli Institute, University of Groningen,Groningen,The Netherlands","University of Groningen"],"affiliations":[{"raw_affiliation_string":"Bernoulli Institute, University of Groningen,Groningen,The Netherlands","institution_ids":["https://openalex.org/I169381384"]},{"raw_affiliation_string":"University of Groningen","institution_ids":["https://openalex.org/I169381384"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028858025","display_name":"Lambert Schomaker","orcid":"https://orcid.org/0000-0003-2351-930X"},"institutions":[{"id":"https://openalex.org/I169381384","display_name":"University of Groningen","ror":"https://ror.org/012p63287","country_code":"NL","type":"education","lineage":["https://openalex.org/I169381384"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Lambert Schomaker","raw_affiliation_strings":["Bernoulli Institute, University of Groningen,Groningen,The Netherlands","University of Groningen"],"affiliations":[{"raw_affiliation_string":"Bernoulli Institute, University of Groningen,Groningen,The Netherlands","institution_ids":["https://openalex.org/I169381384"]},{"raw_affiliation_string":"University of Groningen","institution_ids":["https://openalex.org/I169381384"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100605424"],"corresponding_institution_ids":["https://openalex.org/I169381384"],"apc_list":null,"apc_paid":null,"fwci":0.1938,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.45326656,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7914322018623352},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6630048751831055},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6362094283103943},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.5943050384521484},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.5373007655143738},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.49747684597969055},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4659591317176819},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.420045405626297},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41104692220687866},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3524476885795593}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7914322018623352},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6630048751831055},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6362094283103943},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.5943050384521484},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.5373007655143738},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.49747684597969055},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4659591317176819},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.420045405626297},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41104692220687866},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3524476885795593},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9533527","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9533527","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.rug.nl:publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","is_oa":true,"landing_page_url":"https://research.rug.nl/en/publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","pdf_url":null,"source":{"id":"https://openalex.org/S4306400420","display_name":"University of Groningen research database (University of Groningen / Centre for Information Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I169381384","host_organization_name":"University of Groningen","host_organization_lineage":["https://openalex.org/I169381384"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Zhang, Z & Schomaker, L 2021, DTGAN : Dual Attention Generative Adversarial Networks for Text-to-Image Generation. in 2021 International Joint Conference on Neural Networks (IJCNN). IEEE, 2021 International Joint Conference on Neural Networks (IJCNN), 18/07/2021. https://doi.org/10.1109/IJCNN52387.2021.9533527","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"mag:3096458759","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/2011.02709","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:pure.rug.nl:openaire_cris_publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","is_oa":true,"landing_page_url":"https://hdl.handle.net/11370/dbf1e751-857b-457b-b390-19ef2ee7f18f","pdf_url":null,"source":{"id":"https://openalex.org/S4306400420","display_name":"University of Groningen research database (University of Groningen / Centre for Information Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I169381384","host_organization_name":"University of Groningen","host_organization_lineage":["https://openalex.org/I169381384"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Zhang, Z & Schomaker, L 2021, DTGAN : Dual Attention Generative Adversarial Networks for Text-to-Image Generation. in 2021 International Joint Conference on Neural Networks (IJCNN). IEEE, 2021 International Joint Conference on Neural Networks (IJCNN), 18/07/2021. https://doi.org/10.1109/IJCNN52387.2021.9533527","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:rug:oai:pure.rug.nl:publications/a166d6b2-c491-4655-8c0a-96b8a20763ef","is_oa":true,"landing_page_url":"https://research.rug.nl/en/publications/a166d6b2-c491-4655-8c0a-96b8a20763ef","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ArXiv. Cornell University Press","raw_type":"info:eu-repo/semantics/article"},{"id":"doi:10.48550/arxiv.2011.02709","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2011.02709","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:pure.rug.nl:publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","is_oa":true,"landing_page_url":"https://research.rug.nl/en/publications/dbf1e751-857b-457b-b390-19ef2ee7f18f","pdf_url":null,"source":{"id":"https://openalex.org/S4306400420","display_name":"University of Groningen research database (University of Groningen / Centre for Information Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I169381384","host_organization_name":"University of Groningen","host_organization_lineage":["https://openalex.org/I169381384"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Zhang, Z & Schomaker, L 2021, DTGAN : Dual Attention Generative Adversarial Networks for Text-to-Image Generation. in 2021 International Joint Conference on Neural Networks (IJCNN). IEEE, 2021 International Joint Conference on Neural Networks (IJCNN), 18/07/2021. https://doi.org/10.1109/IJCNN52387.2021.9533527","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"score":0.7400000095367432,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320933","display_name":"Rijksuniversiteit Groningen","ror":"https://ror.org/012p63287"},{"id":"https://openalex.org/F4320337373","display_name":"Center for Information Technology","ror":"https://ror.org/03jh5a977"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1797268635","https://openalex.org/W1861492603","https://openalex.org/W2099471712","https://openalex.org/W2131774270","https://openalex.org/W2173520492","https://openalex.org/W2183341477","https://openalex.org/W2295107390","https://openalex.org/W2502312327","https://openalex.org/W2530372461","https://openalex.org/W2564591810","https://openalex.org/W2745461083","https://openalex.org/W2799062770","https://openalex.org/W2804078698","https://openalex.org/W2914190582","https://openalex.org/W2921224286","https://openalex.org/W2949117887","https://openalex.org/W2949999304","https://openalex.org/W2962845008","https://openalex.org/W2963163163","https://openalex.org/W2963373786","https://openalex.org/W2963402808","https://openalex.org/W2963403868","https://openalex.org/W2963413689","https://openalex.org/W2963521239","https://openalex.org/W2963612019","https://openalex.org/W2963966654","https://openalex.org/W2963981733","https://openalex.org/W2964024144","https://openalex.org/W2964216930","https://openalex.org/W2965289598","https://openalex.org/W2970127127","https://openalex.org/W2970971581","https://openalex.org/W2995910740","https://openalex.org/W3004349648","https://openalex.org/W3034655362","https://openalex.org/W3035284526","https://openalex.org/W3048484056","https://openalex.org/W6631190155","https://openalex.org/W6639102338","https://openalex.org/W6685352114","https://openalex.org/W6713645886","https://openalex.org/W6718379498","https://openalex.org/W6728889164","https://openalex.org/W6739901393","https://openalex.org/W6751546485","https://openalex.org/W6752378368","https://openalex.org/W6755310813","https://openalex.org/W6759785765","https://openalex.org/W6765779288","https://openalex.org/W6766150548","https://openalex.org/W6766978945","https://openalex.org/W6767278793","https://openalex.org/W6767384525","https://openalex.org/W6781951827"],"related_works":["https://openalex.org/W2995545297","https://openalex.org/W3048484056","https://openalex.org/W3012970712","https://openalex.org/W2984809863","https://openalex.org/W3097613717","https://openalex.org/W3000055254","https://openalex.org/W3111484932","https://openalex.org/W3162362121","https://openalex.org/W3047385447","https://openalex.org/W2784287200","https://openalex.org/W2964044605","https://openalex.org/W3033047436","https://openalex.org/W3194214700","https://openalex.org/W3090238363","https://openalex.org/W3088478528","https://openalex.org/W3206076554","https://openalex.org/W3009227557","https://openalex.org/W3105979354","https://openalex.org/W2798813225","https://openalex.org/W2981335848"],"abstract_inverted_index":{"Most":[0],"existing":[1],"text-to-image":[2],"generation":[3],"methods":[4],"adopt":[5],"a":[6,72,141,184],"multi-stage":[7,185],"modular":[8],"architecture":[9],"which":[10,62],"has":[11],"three":[12],"significant":[13],"problems:":[14],"1)":[15],"Training":[16],"multiple":[17],"networks":[18],"increases":[19],"the":[20,25,30,37,55,88,99,127,136,151,172,180],"run":[21],"time":[22],"and":[23,27,66,81,95,103,133,158],"affects":[24],"convergence":[26],"stability":[28],"of":[29,39,129,144,163,174],"generative":[31],"model;":[32],"2)":[33],"These":[34],"approaches":[35],"ignore":[36],"quality":[38],"early-stage":[40],"generator":[41,89],"images;":[42],"3)":[43],"Many":[44],"discriminators":[45],"need":[46],"to":[47,90,104,120,149,179],"be":[48],"trained.":[49],"To":[50],"this":[51],"end,":[52],"we":[53],"propose":[54],"Dual":[56],"Attention":[57],"Generative":[58],"Adversarial":[59],"Network":[60],"(DTGAN)":[61],"can":[63,86],"synthesize":[64],"high-quality":[65],"semantically":[67],"consistent":[68],"images":[69],"only":[70],"employing":[71],"single":[73],"generator/discriminator":[74],"pair.":[75],"The":[76],"proposed":[77,176],"model":[78],"introduces":[79],"channel-aware":[80],"pixel-aware":[82],"attention":[83,110,123],"modules":[84,124],"that":[85],"guide":[87],"focus":[91],"on":[92,98,168],"text-relevant":[93],"channels":[94],"pixels":[96],"based":[97],"global":[100],"sentence":[101],"vector":[102],"fine-tune":[105],"original":[106],"feature":[107],"maps":[108],"using":[109],"weights.":[111],"Also,":[112],"Conditional":[113],"Adaptive":[114],"Instance-Layer":[115],"Normalization":[116],"(CAdaILN)":[117],"is":[118,147],"presented":[119],"help":[121],"our":[122,175],"flexibly":[125],"control":[126],"amount":[128],"change":[130],"in":[131],"shape":[132,157],"texture":[134],"by":[135,154],"input":[137],"natural-language":[138],"description.":[139],"Furthermore,":[140],"new":[142],"type":[143],"visual":[145],"loss":[146],"utilized":[148],"enhance":[150],"image":[152],"resolution":[153],"ensuring":[155],"vivid":[156],"perceptually":[159],"uniform":[160],"color":[161],"distributions":[162],"generated":[164],"images.":[165],"Experimental":[166],"results":[167],"benchmark":[169],"datasets":[170],"demonstrate":[171],"superiority":[173],"method":[177],"compared":[178],"state-of-the-art":[181],"models":[182],"with":[183],"framework.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-21T08:13:44.787528","created_date":"2025-10-10T00:00:00"}
