{"id":"https://openalex.org/W4403791477","doi":"https://doi.org/10.1145/3664647.3680814","title":"Auto DragGAN: Editing the Generative Image Manifold in an Autoregressive Manner","display_name":"Auto DragGAN: Editing the Generative Image Manifold in an Autoregressive Manner","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791477","doi":"https://doi.org/10.1145/3664647.3680814"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680814","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111346135","display_name":"Pengxiang Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pengxiang Cai","raw_affiliation_strings":["Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107949838","display_name":"Zhiwei Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwei Liu","raw_affiliation_strings":["Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029271867","display_name":"Guibo Zhu","orcid":"https://orcid.org/0000-0001-8293-3952"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guibo Zhu","raw_affiliation_strings":["Foundation Model Research Center, Institute of Automation, Chinese Academy of Science &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Foundation Model Research Center, Institute of Automation, Chinese Academy of Science &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101319174","display_name":"Yunfang Niu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunfang Niu","raw_affiliation_strings":["Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058420913","display_name":"Jinqiao Wang","orcid":"https://orcid.org/0000-0002-9118-2780"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinqiao Wang","raw_affiliation_strings":["Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Foundation Model Research Center, Institute of Automation, Chinese Academy of Sciences &amp; School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5111346135"],"corresponding_institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.2632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.55579084,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"3372","last_page":"3380"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.7499775886535645},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5996825098991394},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5884122848510742},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5332797169685364},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.47943538427352905},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47080788016319275},{"id":"https://openalex.org/keywords/manifold","display_name":"Manifold (fluid mechanics)","score":0.4442242980003357},{"id":"https://openalex.org/keywords/star-model","display_name":"STAR model","score":0.4126951992511749},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3455069363117218},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.28618794679641724},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.14730286598205566},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.11412814259529114},{"id":"https://openalex.org/keywords/time-series","display_name":"Time series","score":0.0955427885055542},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08241242170333862},{"id":"https://openalex.org/keywords/autoregressive-integrated-moving-average","display_name":"Autoregressive integrated moving average","score":0.05055996775627136}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.7499775886535645},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5996825098991394},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5884122848510742},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5332797169685364},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.47943538427352905},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47080788016319275},{"id":"https://openalex.org/C529865628","wikidata":"https://www.wikidata.org/wiki/Q1790740","display_name":"Manifold (fluid mechanics)","level":2,"score":0.4442242980003357},{"id":"https://openalex.org/C194657046","wikidata":"https://www.wikidata.org/wiki/Q7394685","display_name":"STAR model","level":4,"score":0.4126951992511749},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3455069363117218},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28618794679641724},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.14730286598205566},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.11412814259529114},{"id":"https://openalex.org/C151406439","wikidata":"https://www.wikidata.org/wiki/Q186588","display_name":"Time series","level":2,"score":0.0955427885055542},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08241242170333862},{"id":"https://openalex.org/C24338571","wikidata":"https://www.wikidata.org/wiki/Q2566298","display_name":"Autoregressive integrated moving average","level":3,"score":0.05055996775627136},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680814","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4300000071525574,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2115252128","https://openalex.org/W2754925132","https://openalex.org/W2765811365","https://openalex.org/W2962770929","https://openalex.org/W3034600949","https://openalex.org/W3035574324","https://openalex.org/W3174807077","https://openalex.org/W3204682594","https://openalex.org/W4235375376","https://openalex.org/W4285981707","https://openalex.org/W4312782988","https://openalex.org/W4312933868","https://openalex.org/W4385527149","https://openalex.org/W4385535562","https://openalex.org/W4386057725","https://openalex.org/W4386076215","https://openalex.org/W4386076532","https://openalex.org/W6797179183"],"related_works":["https://openalex.org/W2439807930","https://openalex.org/W2009692134","https://openalex.org/W1972271943","https://openalex.org/W2019155478","https://openalex.org/W2024529895","https://openalex.org/W2168175994","https://openalex.org/W1902630399","https://openalex.org/W2120434453","https://openalex.org/W3120578569","https://openalex.org/W1487412319"],"abstract_inverted_index":{"Pixel-level":[0],"fine-grained":[1,28],"image":[2,60,216],"editing":[3,70,217],"remains":[4],"an":[5,13,175],"open":[6],"challenge.":[7],"Previous":[8],"works":[9],"fail":[10,24],"to":[11,25,49,97,115,128,161,171,179],"achieve":[12,26,139],"ideal":[14],"trade-off":[15],"between":[16],"control":[17],"granularity":[18],"and":[19,80,89,215],"inference":[20,32,213],"speed.":[21],"They":[22],"either":[23],"pixel-level":[27,66,221],"control,":[29],"or":[30],"their":[31,81],"speed":[33,214],"requires":[34],"optimization.":[35],"To":[36,138],"address":[37],"this,":[38,140],"this":[39],"paper":[40],"for":[41],"the":[42,51,59,124,130,143,163,181,194,199,220],"first":[43],"time":[44,73],"employs":[45],"a":[46,108,119,133,153,186],"regression-based":[47],"network":[48,157],"learn":[50],"variation":[52],"patterns":[53],"of":[54,132,136,201],"StyleGAN":[55],"latent":[56,164,195],"codes":[57],"during":[58],"dragging":[61,69],"process.":[62],"This":[63],"method":[64,91,209],"enables":[65],"precision":[67],"in":[68,174],"with":[71],"little":[72],"cost.":[74],"Users":[75],"can":[76],"specify":[77],"handle":[78,95,113,169],"points":[79,84,114,117,170,173],"corresponding":[82,99],"target":[83,100,116,172],"on":[85],"any":[86],"GAN-generated":[87],"images,":[88],"our":[90,208],"will":[92],"move":[93],"each":[94],"point":[96],"its":[98],"point.":[101],"Through":[102],"experimental":[103],"analysis,":[104],"we":[105,141,151,184],"discover":[106],"that":[107,207],"short":[109],"movement":[110,131,145],"distance":[111],"from":[112,168],"yields":[118],"high-fidelity":[120],"edited":[121],"image,":[122],"as":[123],"model":[125],"only":[126],"needs":[127],"predict":[129,162],"small":[134],"portion":[135],"pixels.":[137],"decompose":[142],"entire":[144],"process":[146],"into":[147],"multiple":[148],"sub-processes.":[149],"Specifically,":[150],"develop":[152],"transformer":[154],"encoder-decoder":[155],"based":[156],"named":[158,188],"'Latent":[159,189],"Predictor'":[160],"code":[165,196],"motion":[166,197],"trajectories":[167],"autoregressive":[176],"manner.":[177],"Moreover,":[178],"enhance":[180],"prediction":[182],"stability,":[183],"introduce":[185],"component":[187],"Regularizer',":[190],"aimed":[191],"at":[192,219],"constraining":[193],"within":[198],"distribution":[200],"natural":[202],"images.":[203],"Extensive":[204],"experiments":[205],"demonstrate":[206],"achieves":[210],"state-of-the-art":[211],"(SOTA)":[212],"performance":[218],"granularity.":[222]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
