{"id":"https://openalex.org/W7155501847","doi":"https://doi.org/10.48550/arxiv.2604.21776","title":"Reshoot-Anything: A Self-Supervised Model for In-the-Wild Video Reshooting","display_name":"Reshoot-Anything: A Self-Supervised Model for In-the-Wild Video Reshooting","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7155501847","doi":"https://doi.org/10.48550/arxiv.2604.21776"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.21776","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21776","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.21776","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006402988","display_name":"Avinash Paliwal","orcid":"https://orcid.org/0000-0002-9090-6142"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Paliwal, Avinash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134475807","display_name":"Adithya Iyer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Iyer, Adithya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013394043","display_name":"Shivin Yadav","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yadav, Shivin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134486808","display_name":"Muhammad Ali Afridi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Afridi, Muhammad Ali","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5048294802","display_name":"Midhun Harikumar","orcid":"https://orcid.org/0009-0009-2199-5063"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Harikumar, Midhun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.24529999494552612,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.24529999494552612,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.210999995470047,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.1265999972820282,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5443999767303467},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5072000026702881},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.37299999594688416},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.3594000041484833},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.33550000190734863},{"id":"https://openalex.org/keywords/subpixel-rendering","display_name":"Subpixel rendering","score":0.3212999999523163},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.3093000054359436}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7121999859809875},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6998000144958496},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6507999897003174},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5443999767303467},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5072000026702881},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.37299999594688416},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C68516990","wikidata":"https://www.wikidata.org/wiki/Q452912","display_name":"Subpixel rendering","level":3,"score":0.3212999999523163},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2833999991416931},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.2689000070095062},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.2678999900817871},{"id":"https://openalex.org/C2776035091","wikidata":"https://www.wikidata.org/wiki/Q7928819","display_name":"Viewpoints","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.25600001215934753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.21776","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21776","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.21776","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21776","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Precise":[0],"camera":[1,182],"control":[2],"for":[3,17],"reshooting":[4],"dynamic":[5,191],"videos":[6],"is":[7,39,84,134],"bottlenecked":[8],"by":[9,62,87,142],"the":[10,40,77,89,93,103,121,128,156,161],"severe":[11],"scarcity":[12],"of":[13,31,42,48,92],"paired":[14],"multi-view":[15,44],"data":[16],"non-rigid":[18],"scenes.":[19,192],"We":[20,59],"overcome":[21],"this":[22,61],"limitation":[23],"with":[24,95],"a":[25,49,52,56,70,96,171],"highly":[26],"scalable":[27],"self-supervised":[28],"framework":[29],"capable":[30],"leveraging":[32],"internet-scale":[33],"monocular":[34],"videos.":[35],"Our":[36],"core":[37],"contribution":[38],"generation":[41],"pseudo":[43],"training":[45],"triplets,":[46],"consisting":[47],"source":[50,78,94,130,157],"video,":[51],"geometric":[53],"anchor,":[54],"and":[55,79,118,145,153,184],"target":[57,80],"video.":[58],"achieve":[60,177],"extracting":[63],"distinct":[64,151],"smooth":[65],"random-walk":[66],"crop":[67],"trajectories":[68],"from":[69,127,155],"single":[71],"input":[72],"video":[73,158],"to":[74,136,159,176],"serve":[75],"as":[76],"views.":[81],"The":[82],"anchor":[83,175],"synthetically":[85],"generated":[86],"forward-warping":[88],"first":[90],"frame":[91],"dense":[97],"tracking":[98],"field,":[99],"which":[100],"effectively":[101],"simulates":[102],"distorted":[104],"point-cloud":[105,173],"inputs":[106],"expected":[107],"at":[108],"inference.":[109],"Because":[110],"our":[111,165],"independent":[112],"cropping":[113],"strategy":[114],"introduces":[115],"spatial":[116],"misalignment":[117],"artificial":[119],"occlusions,":[120],"model":[122],"cannot":[123],"simply":[124],"copy":[125],"information":[126],"current":[129],"frame.":[131],"Instead,":[132],"it":[133],"forced":[135],"implicitly":[137],"learn":[138],"4D":[139,172],"spatiotemporal":[140],"structures":[141],"actively":[143],"routing":[144],"re-projecting":[146],"missing":[147],"high-fidelity":[148,185],"textures":[149],"across":[150],"times":[152],"viewpoints":[154],"reconstruct":[160],"target.":[162],"At":[163],"inference,":[164],"minimally":[166],"adapted":[167],"diffusion":[168],"transformer":[169],"utilizes":[170],"derived":[174],"state-of-the-art":[178],"temporal":[179],"consistency,":[180],"robust":[181],"control,":[183],"novel":[186],"view":[187],"synthesis":[188],"on":[189],"complex":[190]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-25T00:00:00"}
