{"id":"https://openalex.org/W4389109089","doi":"https://doi.org/10.1145/3628454.3631665","title":"Attention-driven Text-guided Image Manipulation","display_name":"Attention-driven Text-guided Image Manipulation","publication_year":2023,"publication_date":"2023-11-28","ids":{"openalex":"https://openalex.org/W4389109089","doi":"https://doi.org/10.1145/3628454.3631665"},"language":"en","primary_location":{"id":"doi:10.1145/3628454.3631665","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3628454.3631665","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Advances in Information Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111082241","display_name":"Jiayu Su","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112116","display_name":"Mianyang City Center for Disease Control and Prevention","ror":"https://ror.org/020w9yc61","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210112116"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayu Su","raw_affiliation_strings":["Mianyang City College, China"],"affiliations":[{"raw_affiliation_string":"Mianyang City College, China","institution_ids":["https://openalex.org/I4210112116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019348755","display_name":"Zhiqiang Zhang","orcid":"https://orcid.org/0000-0002-2408-366X"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Zhang","raw_affiliation_strings":["Southwest University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Southwest University of Science and Technology, China","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102793173","display_name":"Qiang Han","orcid":"https://orcid.org/0009-0007-1137-3557"},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Han","raw_affiliation_strings":["Xihua University, China"],"affiliations":[{"raw_affiliation_string":"Xihua University, China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024674930","display_name":"Xin Cheng","orcid":"https://orcid.org/0000-0002-3892-2727"},"institutions":[{"id":"https://openalex.org/I204291657","display_name":"Hosei University","ror":"https://ror.org/00bx6dj65","country_code":"JP","type":"education","lineage":["https://openalex.org/I204291657"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Xin Cheng","raw_affiliation_strings":["Hosei University, Japan"],"affiliations":[{"raw_affiliation_string":"Hosei University, Japan","institution_ids":["https://openalex.org/I204291657"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062070683","display_name":"Wanlin Zhao","orcid":"https://orcid.org/0009-0008-3394-2754"},"institutions":[{"id":"https://openalex.org/I4210142656","display_name":"Instrumentation Technology and Economy Institute","ror":"https://ror.org/04983b693","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210142656"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wanlin Zhao","raw_affiliation_strings":["Instrumentation Technology and Economy Institute, China"],"affiliations":[{"raw_affiliation_string":"Instrumentation Technology and Economy Institute, China","institution_ids":["https://openalex.org/I4210142656"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100691161","display_name":"Wei Zhang","orcid":"https://orcid.org/0000-0002-5205-9368"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["Southwest University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Southwest University of Science and Technology, China","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049814360","display_name":"Wenxin Yu","orcid":"https://orcid.org/0000-0002-6093-5516"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxin Yu","raw_affiliation_strings":["Southwest University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Southwest University of Science and Technology, China","institution_ids":["https://openalex.org/I1297991670"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111082241"],"corresponding_institution_ids":["https://openalex.org/I4210112116"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.15561251,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-manipulation","display_name":"Image manipulation","score":0.7799662351608276},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7718629837036133},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6859161853790283},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6086726784706116},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5989466905593872},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5898197293281555},{"id":"https://openalex.org/keywords/image-quality","display_name":"Image quality","score":0.5404795408248901},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.506862461566925},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4998929500579834}],"concepts":[{"id":"https://openalex.org/C2987933465","wikidata":"https://www.wikidata.org/wiki/Q141130","display_name":"Image manipulation","level":3,"score":0.7799662351608276},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7718629837036133},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6859161853790283},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6086726784706116},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5989466905593872},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5898197293281555},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.5404795408248901},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.506862461566925},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4998929500579834},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3628454.3631665","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3628454.3631665","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Advances in Information Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W2131774270","https://openalex.org/W2183341477","https://openalex.org/W2962845008","https://openalex.org/W2963163163","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2964313012"],"related_works":["https://openalex.org/W2949816130","https://openalex.org/W2096230562","https://openalex.org/W2225239186","https://openalex.org/W2037030319","https://openalex.org/W4307186884","https://openalex.org/W3183170284","https://openalex.org/W2042193908","https://openalex.org/W2788541584","https://openalex.org/W2572781942","https://openalex.org/W4226341727"],"abstract_inverted_index":{"The":[0,104],"main":[1],"content":[2,19],"of":[3,12,40,63,79,91,128],"Text-guided":[4],"Image":[5],"Manipulation":[6],"(TGIM)":[7],"research":[8,31],"is":[9,56,107],"the":[10,17,21,38,61,67,76,83,89,118,125,129,136,140,144],"use":[11],"textual":[13],"information":[14],"to":[15,45,58,74,98,135],"modify":[16],"corresponding":[18],"in":[20],"input":[22],"image.":[23],"Based":[24],"on":[25,110,132],"generative":[26],"adversarial":[27],"networks":[28],"(GAN),":[29],"this":[30,50],"has":[32],"achieved":[33],"impressive":[34],"manipulation":[35,42,81,93,102],"performance.":[36],"Nevertheless,":[37],"quality":[39,62,90],"image":[41,64,80,92,101],"still":[43],"needs":[44],"be":[46,95],"further":[47,59],"improved.":[48],"In":[49],"paper,":[51],"an":[52,71],"attention-driven":[53],"TGIM":[54,138],"method":[55,69,106,131,142],"proposed":[57,68,105,130,141],"improve":[60],"manipulation.":[65],"Specifically,":[66],"uses":[70],"attention":[72],"mechanism":[73],"fine-tune":[75],"whole":[77],"process":[78],"at":[82],"word":[84],"level.":[85],"Through":[86],"attentional":[87],"fine-tuning,":[88],"can":[94],"continuously":[96],"improved":[97],"realize":[99],"high-quality":[100],"effects.":[103],"experimentally":[108],"validated":[109],"a":[111],"public":[112],"Caltech-UCSD":[113],"birds-200-2011":[114],"(CUB)":[115],"dataset,":[116],"and":[117,120,150],"qualitative":[119],"quantitative":[121],"comparison":[122],"results":[123],"demonstrate":[124],"superior":[126],"performance":[127],"TGIM.":[133],"Compared":[134],"existing":[137],"methods,":[139],"improves":[143],"Inception":[145,153],"Score":[146],"(IS)":[147],"by":[148,156],"22.6%":[149],"reduces":[151],"Fr\u00e9chet":[152],"Distance":[154],"(FID)":[155],"13.4%.":[157]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
