{"id":"https://openalex.org/W7094957383","doi":"https://doi.org/10.1145/3746027.3755474","title":"AnchorSync: Global Consistency Optimization for Long Video Editing","display_name":"AnchorSync: Global Consistency Optimization for Long Video Editing","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W7094957383","doi":"https://doi.org/10.1145/3746027.3755474"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755474","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755474","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zichi Liu","orcid":"https://orcid.org/0009-0008-7154-4220"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zichi Liu","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yinggui Wang","orcid":"https://orcid.org/0000-0002-6686-6603"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yinggui Wang","raw_affiliation_strings":["Ant Group, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Ant Group, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tao Wei","orcid":"https://orcid.org/0009-0000-4027-0310"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao Wei","raw_affiliation_strings":["Ant Group, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Ant Group, Shanghai, China","institution_ids":[]}]},{"author_position":"last","author":{"id":null,"display_name":"Chao Ma","orcid":"https://orcid.org/0000-0002-8459-2845"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Ma","raw_affiliation_strings":["MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.55635243,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4494","last_page":"4503"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.1687999963760376,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.1687999963760376,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T13720","display_name":"Benford\u2019s Law and Fraud Detection","score":0.1266999989748001,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.05999999865889549,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5662999749183655},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.49230000376701355},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.46560001373291016},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.44440001249313354},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.42250001430511475},{"id":"https://openalex.org/keywords/data-consistency","display_name":"Data consistency","score":0.4025000035762787},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.3831999897956848},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.37959998846054077},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.34850001335144043}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.802299976348877},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5662999749183655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5184000134468079},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.49230000376701355},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.44440001249313354},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.42250001430511475},{"id":"https://openalex.org/C93361087","wikidata":"https://www.wikidata.org/wiki/Q4426698","display_name":"Data consistency","level":2,"score":0.4025000035762787},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.3831999897956848},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.37959998846054077},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3734000027179718},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.34850001335144043},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.31380000710487366},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C137105694","wikidata":"https://www.wikidata.org/wiki/Q3407510","display_name":"Local consistency","level":4,"score":0.28529998660087585},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.28360000252723694},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.25940001010894775},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3755474","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755474","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2956900569","https://openalex.org/W3113360161","https://openalex.org/W3214649539","https://openalex.org/W3216352822","https://openalex.org/W4313595665","https://openalex.org/W4387426141","https://openalex.org/W4404985095"],"related_works":[],"abstract_inverted_index":{"Editing":[0],"long":[1],"videos":[2],"remains":[3],"a":[4,40,70],"challenging":[5],"task":[6,53],"due":[7],"to":[8],"the":[9,52],"need":[10],"for":[11],"maintaining":[12],"both":[13],"global":[14],"consistency":[15,68],"and":[16,59,74,96],"temporal":[17,31,76,97],"coherence":[18],"across":[19],"thousands":[20],"of":[21],"frames.":[22],"Existing":[23],"methods":[24,92],"often":[25],"suffer":[26],"from":[27],"structural":[28,67],"drift":[29],"or":[30],"artifacts,":[32],"particularly":[33],"in":[34,93],"minute-long":[35],"sequences.":[36],"We":[37],"introduce":[38],"AnchorSync,":[39],"novel":[41],"diffusion-based":[42],"framework":[43],"that":[44,84],"enables":[45],"high-quality,":[46],"long-term":[47],"video":[48],"editing":[49,58],"by":[50],"decoupling":[51],"into":[54],"sparse":[55],"anchor":[56],"frame":[57,62],"smooth":[60],"intermediate":[61],"interpolation.":[63],"Our":[64],"approach":[65],"enforces":[66],"through":[69],"progressive":[71],"denoising":[72],"process":[73],"preserves":[75],"dynamics":[77],"via":[78],"multimodal":[79],"guidance.":[80],"Extensive":[81],"experiments":[82],"show":[83],"AnchorSync":[85],"produces":[86],"coherent,":[87],"high-fidelity":[88],"edits,":[89],"surpassing":[90],"prior":[91],"visual":[94],"quality":[95],"stability.":[98],"The":[99],"source":[100],"code":[101],"is":[102],"available":[103],"at":[104],"https://github.com/VISION-SJTU/AnchorSync.":[105]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-25T00:00:00"}
