{"id":"https://openalex.org/W3093122931","doi":"https://doi.org/10.1145/3394171.3413551","title":"Sequential Attention GAN for Interactive Image Editing","display_name":"Sequential Attention GAN for Interactive Image Editing","publication_year":2020,"publication_date":"2020-10-12","ids":{"openalex":"https://openalex.org/W3093122931","doi":"https://doi.org/10.1145/3394171.3413551","mag":"3093122931"},"language":"en","primary_location":{"id":"doi:10.1145/3394171.3413551","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3394171.3413551","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101580523","display_name":"Yu Cheng","orcid":"https://orcid.org/0000-0002-7901-8662"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yu Cheng","raw_affiliation_strings":["Microsoft Dynamics 365 AI Research, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Dynamics 365 AI Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066666034","display_name":"Zhe Gan","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhe Gan","raw_affiliation_strings":["Microsoft Dynamics 365 AI Research, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Dynamics 365 AI Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100413888","display_name":"Yitong Li","orcid":"https://orcid.org/0009-0009-3874-6055"},"institutions":[{"id":"https://openalex.org/I170897317","display_name":"Duke University","ror":"https://ror.org/00py81415","country_code":"US","type":"education","lineage":["https://openalex.org/I170897317"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yitong Li","raw_affiliation_strings":["Duke University, Durham, NC, USA"],"affiliations":[{"raw_affiliation_string":"Duke University, Durham, NC, USA","institution_ids":["https://openalex.org/I170897317"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100442542","display_name":"Jingjing Liu","orcid":"https://orcid.org/0009-0002-6277-5816"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingjing Liu","raw_affiliation_strings":["Microsoft Dynamics 365 AI Research, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Dynamics 365 AI Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047233371","display_name":"Jianfeng Gao","orcid":"https://orcid.org/0000-0002-6371-505X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jianfeng Gao","raw_affiliation_strings":["Microsoft Research, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101580523"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":4.5142,"has_fulltext":false,"cited_by_count":71,"citation_normalized_percentile":{"value":0.95841505,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"4383","last_page":"4391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9704999923706055,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8625432252883911},{"id":"https://openalex.org/keywords/session","display_name":"Session (web analytics)","score":0.6182239055633545},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5772479772567749},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5745649337768555},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.565970242023468},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5357840061187744},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5313559174537659},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5044797658920288},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.48877593874931335},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.4862626791000366},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4439142346382141},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32209500670433044}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8625432252883911},{"id":"https://openalex.org/C2779182362","wikidata":"https://www.wikidata.org/wiki/Q17126187","display_name":"Session (web analytics)","level":2,"score":0.6182239055633545},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5772479772567749},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5745649337768555},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.565970242023468},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5357840061187744},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5313559174537659},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5044797658920288},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.48877593874931335},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.4862626791000366},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4439142346382141},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32209500670433044},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3394171.3413551","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3394171.3413551","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"display_name":"Responsible consumption and production","id":"https://metadata.un.org/sdg/12"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1924770834","https://openalex.org/W1933349210","https://openalex.org/W2024539680","https://openalex.org/W2093848332","https://openalex.org/W2108598243","https://openalex.org/W2141708418","https://openalex.org/W2194775991","https://openalex.org/W2247513039","https://openalex.org/W2298992465","https://openalex.org/W2302548814","https://openalex.org/W2471768434","https://openalex.org/W2548275288","https://openalex.org/W2558809543","https://openalex.org/W2560481159","https://openalex.org/W2583186419","https://openalex.org/W2617322972","https://openalex.org/W2735001949","https://openalex.org/W2774015909","https://openalex.org/W2774397635","https://openalex.org/W2788768663","https://openalex.org/W2808162831","https://openalex.org/W2889077639","https://openalex.org/W2891417743","https://openalex.org/W2962793481","https://openalex.org/W2962883855","https://openalex.org/W2963047368","https://openalex.org/W2963073614","https://openalex.org/W2963145877","https://openalex.org/W2963184176","https://openalex.org/W2963201933","https://openalex.org/W2963389687","https://openalex.org/W2963420272","https://openalex.org/W2963636184","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2964318046","https://openalex.org/W2965833116","https://openalex.org/W2987919422","https://openalex.org/W3035083401","https://openalex.org/W3088653102","https://openalex.org/W3098232790","https://openalex.org/W4249013746","https://openalex.org/W6712785310","https://openalex.org/W6713645886","https://openalex.org/W6734074887","https://openalex.org/W6745992979","https://openalex.org/W6746893431","https://openalex.org/W6751039726"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2378211422","https://openalex.org/W2988126442","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W1974414866","https://openalex.org/W2130974462"],"abstract_inverted_index":{"Most":[0],"existing":[1],"text-to-image":[2],"synthesis":[3],"tasks":[4],"are":[5,90],"static":[6],"single-turn":[7],"generation,":[8],"based":[9],"on":[10,197,221,233],"pre-defined":[11],"textual":[12,44,102,147],"descriptions":[13],"of":[14,152,165],"images.":[15],"To":[16,120,180,195],"explore":[17],"more":[18],"practical":[19],"and":[20,63,85,99,145,155,175,207,249],"interactive":[21,86,235],"real-life":[22],"applications,":[23],"we":[24,124,185,201],"introduce":[25,187,202],"a":[26,53,72,96,126,136,157,162,188],"new":[27,73,199,204],"task":[28,89,238],"-":[29],"Interactive":[30],"Image":[31],"Editing,":[32],"where":[33],"users":[34],"can":[35],"guide":[36],"an":[37],"agent":[38,51],"to":[39,71,108,140,160],"edit":[40],"images":[41,174],"via":[42],"multi-turn":[43,211],"commands":[45],"on-the-fly.":[46],"In":[47],"each":[48,118,150],"session,":[49],"the":[50,58,61,65,76,100,113,142,146,153,166,172,178,193,198,217,226,234],"takes":[52],"natural":[54],"language":[55],"description":[56,148],"from":[57],"user":[59,77],"as":[60],"input,":[62],"modifies":[64],"image":[66,87,98,115,144,167,236,246],"generated":[67,97,114],"in":[68,82,117,149,216],"previous":[69,143],"turn":[70,151],"design,":[74],"following":[75],"description.":[78,179],"The":[79],"main":[80],"challenges":[81],"this":[83],"sequential":[84,189],"generation":[88],"two-fold:":[91],"1)":[92],"contextual":[93],"consistency":[94,111],"between":[95],"provided":[101],"description;":[103],"2)":[104],"step-by-step":[105],"region-level":[106],"modification":[107],"maintain":[109],"visual":[110,244],"across":[112,239],"sequence":[116,247],"session.":[119],"address":[121],"these":[122],"challenges,":[123],"propose":[125],"novel":[127],"Sequential":[128],"Attention":[129],"Generative":[130],"Adversarial":[131],"Network":[132],"(SeqAttnGAN),":[133],"which":[134,209],"applies":[135],"neural":[137],"state":[138],"tracker":[139],"encode":[141],"sequence,":[154],"uses":[156],"GAN":[158],"framework":[159],"generate":[161],"modified":[163],"version":[164],"that":[168,225],"is":[169],"consistent":[170],"with":[171,177,213],"preceding":[173],"coherent":[176],"achieve":[181],"better":[182],"region-specific":[183],"refinement,":[184],"also":[186],"attention":[190],"mechanism":[191],"into":[192],"model.":[194],"benchmark":[196],"task,":[200],"two":[203],"datasets,":[205],"Zap-Seq":[206],"DeepFashion-Seq,":[208],"contain":[210],"sessions":[212],"image-description":[214],"sequences":[215],"fashion":[218],"domain.":[219],"Experiments":[220],"both":[222],"datasets":[223],"show":[224],"proposed":[227],"SeqAttnGAN":[228],"model":[229],"outperforms":[230],"state-of-the-art":[231],"approaches":[232],"editing":[237],"all":[240],"evaluation":[241],"metrics":[242],"including":[243],"quality,":[245],"coherence":[248],"text-image":[250],"consistency.":[251]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":14},{"year":2020,"cited_by_count":5}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
