{"id":"https://openalex.org/W4415539071","doi":"https://doi.org/10.1145/3746027.3758205","title":"<scp>EditWorld:</scp> Simulating World Dynamics for Instruction-Following Image Editing","display_name":"<scp>EditWorld:</scp> Simulating World Dynamics for Instruction-Following Image Editing","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415539071","doi":"https://doi.org/10.1145/3746027.3758205"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3758205","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3758205","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746027.3758205","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101788611","display_name":"Bohan Zeng","orcid":"https://orcid.org/0009-0009-9019-6097"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bohan Zeng","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022659405","display_name":"L. Yang","orcid":"https://orcid.org/0000-0003-1905-8053"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ling Yang","raw_affiliation_strings":["Princeton University, Princeton, USA and Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Princeton University, Princeton, USA and Peking University, Beijing, China","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107063648","display_name":"Jiaming Liu","orcid":"https://orcid.org/0009-0001-4584-9388"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaming Liu","raw_affiliation_strings":["Alibaba Group, Beijing, China and Tiamat AI, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China and Tiamat AI, Shanghai, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103079796","display_name":"Minghao Xu","orcid":"https://orcid.org/0000-0001-7468-8790"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minghao Xu","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020022791","display_name":"Yuanxing Zhang","orcid":"https://orcid.org/0000-0003-1460-8124"},"institutions":[{"id":"https://openalex.org/I4210108109","display_name":"Beijing Enterprises (China)","ror":"https://ror.org/01egb4878","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210108109"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanxing Zhang","raw_affiliation_strings":["Kling Team, Kuaishou, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kling Team, Kuaishou, Beijing, China","institution_ids":["https://openalex.org/I4210108109"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101928510","display_name":"Pengfei Wan","orcid":"https://orcid.org/0000-0001-7225-565X"},"institutions":[{"id":"https://openalex.org/I4210108109","display_name":"Beijing Enterprises (China)","ror":"https://ror.org/01egb4878","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210108109"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengfei Wan","raw_affiliation_strings":["Kling Team, Kuaishou, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kling Team, Kuaishou, Beijing, China","institution_ids":["https://openalex.org/I4210108109"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008772211","display_name":"Wentao Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wentao Zhang","raw_affiliation_strings":["Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100381753","display_name":"Shuicheng Yan","orcid":"https://orcid.org/0000-0001-8906-3777"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shuicheng Yan","raw_affiliation_strings":["National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101788611"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":1.2181,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.84527884,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"12674","last_page":"12681"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9610000252723694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9435999989509583,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.9355000257492065},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6929000020027161},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5863999724388123},{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.532800018787384},{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.4309000074863434},{"id":"https://openalex.org/keywords/train","display_name":"Train","score":0.36489999294281006}],"concepts":[{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.9355000257492065},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8034999966621399},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6929000020027161},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5863999724388123},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.532800018787384},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4339999854564667},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.4309000074863434},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.42579999566078186},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.38769999146461487},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.36489999294281006},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3440000116825104},{"id":"https://openalex.org/C87829876","wikidata":"https://www.wikidata.org/wiki/Q648877","display_name":"Post-production","level":2,"score":0.33410000801086426},{"id":"https://openalex.org/C2987933465","wikidata":"https://www.wikidata.org/wiki/Q141130","display_name":"Image manipulation","level":3,"score":0.3262999951839447},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3052000105381012},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2542000114917755},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.25209999084472656}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3758205","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3758205","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3746027.3758205","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746027.3758205","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8708956154","display_name":null,"funder_award_id":"2024YFA1014003","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W3107803166","https://openalex.org/W3173143063","https://openalex.org/W3216352822","https://openalex.org/W4312529357","https://openalex.org/W4312872987","https://openalex.org/W4312933868","https://openalex.org/W4386076215","https://openalex.org/W4386113271","https://openalex.org/W4390873054","https://openalex.org/W4390874575","https://openalex.org/W4402716297","https://openalex.org/W4402716387","https://openalex.org/W4402727613"],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"models":[1,121],"have":[2],"significantly":[3,158],"improved":[4],"the":[5,73,78,98,142],"performance":[6],"of":[7,65,68,118,131],"image":[8,18,92,109,135],"editing.":[9],"Existing":[10],"methods":[11,162],"realize":[12],"various":[13,102],"approaches":[14],"to":[15,24],"achieve":[16],"high-quality":[17],"editing,":[19,93,136],"including":[20],"but":[21],"not":[22],"limited":[23],"text":[25],"control,":[26],"dragging":[27],"operation,":[28],"and":[29,40,62,96,125,145],"mask-and-inpainting.":[30],"Among":[31],"these,":[32],"instruction-based":[33],"editing":[34,55,88,110,161],"stands":[35],"out":[36],"for":[37,134],"its":[38],"convenience":[39],"effectiveness":[41],"in":[42,77,141,163],"following":[43],"human":[44],"instructions":[45,99,114],"across":[46],"diverse":[47],"scenarios.":[48,104],"However,":[49],"it":[50],"still":[51],"focuses":[52],"on":[53],"simple":[54],"operations":[56],"like":[57],"adding,":[58],"replacing,":[59],"or":[60],"deleting,":[61],"falls":[63],"short":[64],"understanding":[66],"aspects":[67],"world":[69,103,113,132],"dynamics":[70,133],"that":[71],"convey":[72],"realistic":[74],"dynamic":[75],"nature":[76],"physical":[79],"world.":[80],"Therefore,":[81],"this":[82,164],"work":[83],"EditWorld":[84,138],"introduces":[85],"a":[86,107,116],"new":[87,108,165],"task,":[89],"namely":[90],"world-instructed":[91],"which":[94],"defines":[95],"categorizes":[97],"grounded":[100],"by":[101],"We":[105],"curate":[106],"dataset":[111],"with":[112,149],"using":[115],"set":[117],"large":[119],"pretrained":[120],"(e.g.,":[122],"GPT,":[123],"Video-LLava":[124],"SDXL).":[126],"To":[127],"enable":[128],"sufficient":[129],"simulation":[130],"our":[137,156],"trains":[139],"model":[140],"curated":[143],"dataset,":[144],"improves":[146],"instruction-following":[147],"ability":[148],"designed":[150],"post-edit":[151],"strategy.":[152],"Extensive":[153],"experiments":[154],"demonstrate":[155],"method":[157],"outperforms":[159],"existing":[160],"task.":[166],"https://github.com/YangLing0818/EditWorld":[167]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-25T00:00:00"}
