{"id":"https://openalex.org/W7139950550","doi":"https://doi.org/10.48550/arxiv.2603.19224","title":"EffectErase: Joint Video Object Removal and Insertion for High-Quality Effect Erasing","display_name":"EffectErase: Joint Video Object Removal and Insertion for High-Quality Effect Erasing","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139950550","doi":"https://doi.org/10.48550/arxiv.2603.19224"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.19224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.19224","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130231423","display_name":"Yang Fu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fu, Yang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130242793","display_name":"Yike Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073327273","display_name":"Ziyun Dai","orcid":"https://orcid.org/0009-0002-6560-3972"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Ziyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130233831","display_name":"Henghui Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Henghui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5130231423"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8977000117301941,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8977000117301941,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.02280000038444996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.022099999710917473,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.8183000087738037},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6503999829292297},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5846999883651733},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.53329998254776},{"id":"https://openalex.org/keywords/method","display_name":"Method","score":0.5218999981880188},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4666000008583069},{"id":"https://openalex.org/keywords/reciprocal","display_name":"Reciprocal","score":0.4537000060081482}],"concepts":[{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.8183000087738037},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7796000242233276},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7189000248908997},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6776999831199646},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6503999829292297},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5846999883651733},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.53329998254776},{"id":"https://openalex.org/C512554520","wikidata":"https://www.wikidata.org/wiki/Q815844","display_name":"Method","level":3,"score":0.5218999981880188},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4666000008583069},{"id":"https://openalex.org/C2777742833","wikidata":"https://www.wikidata.org/wiki/Q1964083","display_name":"Reciprocal","level":2,"score":0.4537000060081482},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4196999967098236},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.392300009727478},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C20894473","wikidata":"https://www.wikidata.org/wiki/Q1116105","display_name":"Object model","level":3,"score":0.319599986076355},{"id":"https://openalex.org/C53073257","wikidata":"https://www.wikidata.org/wiki/Q7075021","display_name":"Object-oriented design","level":3,"score":0.2922999858856201},{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.2824000120162964},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2777999937534332},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.19224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.19224","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19224","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"object":[1,28,65,99,110,117,140,158,164,224],"removal":[2,29,159],"aims":[3],"to":[4,38,43],"eliminate":[5],"dynamic":[6,146],"target":[7,98],"objects":[8,34],"and":[9,17,27,42,72,105,111,127,134,188,202,208],"their":[10],"visual":[11],"effects,":[12],"such":[13],"as":[14,142,144,166],"deformation,":[15],"shadows,":[16],"reflections,":[18],"while":[19],"restoring":[20],"seamless":[21],"backgrounds.":[22,46],"Recent":[23],"diffusion-based":[24],"video":[25,95,123,157,163,223],"inpainting":[26],"methods":[30],"can":[31],"remove":[32],"the":[33,55,97,109,167],"but":[35],"often":[36],"struggle":[37],"erase":[39],"these":[40],"effects":[41,66,104,112,132],"synthesize":[44],"coherent":[45],"Beyond":[47],"method":[48,160],"limitations,":[49],"progress":[50],"is":[51,100],"further":[52],"hampered":[53],"by":[54],"lack":[56],"of":[57,93,139,205],"a":[58,83,106,136,172],"comprehensive":[59],"dataset":[60,85],"that":[61,86,161,182,198],"systematically":[62],"captures":[63],"common":[64],"across":[67,227],"varied":[68],"environments":[69],"for":[70],"training":[71],"evaluation.":[73],"To":[74],"address":[75],"this,":[76],"we":[77,152],"introduce":[78],"VOR":[79,119],"(Video":[80],"Object":[81],"Removal),":[82],"large-scale":[84],"provides":[87],"diverse":[88,228],"paired":[89],"videos,":[90],"each":[91],"consisting":[92],"one":[94],"where":[96,108],"present":[101],"with":[102,115],"its":[103],"counterpart":[107],"are":[113],"absent,":[114],"corresponding":[116],"masks.":[118],"contains":[120],"60K":[121],"high-quality":[122,222],"pairs":[124],"from":[125],"captured":[126],"synthetic":[128],"sources,":[129],"covers":[130],"five":[131],"types,":[133],"spans":[135],"wide":[137],"range":[138],"categories":[141],"well":[143],"complex,":[145],"multi-object":[147],"scenes.":[148],"Building":[149],"on":[150,185,212],"VOR,":[151,213],"propose":[153],"EffectErase,":[154],"an":[155,194],"effect-aware":[156],"treats":[162],"insertion":[165],"inverse":[168],"auxiliary":[169],"task":[170,191],"within":[171],"reciprocal":[173],"learning":[174,184],"scheme.":[175],"The":[176],"model":[177],"includes":[178],"task-aware":[179],"region":[180],"guidance":[181],"focuses":[183],"affected":[186],"areas":[187],"enables":[189],"flexible":[190],"switching.":[192],"Then,":[193],"insertion-removal":[195],"consistency":[196],"objective":[197],"encourages":[199],"complementary":[200],"behaviors":[201],"shared":[203],"localization":[204],"effect":[206,225],"regions":[207],"structural":[209],"cues.":[210],"Trained":[211],"EffectErase":[214],"achieves":[215],"superior":[216],"performance":[217],"in":[218],"extensive":[219],"experiments,":[220],"delivering":[221],"erasing":[226],"scenarios.":[229]},"counts_by_year":[],"updated_date":"2026-03-21T06:36:02.116451","created_date":"2026-03-21T00:00:00"}
