{"id":"https://openalex.org/W7128521135","doi":"https://doi.org/10.48550/arxiv.2602.08068","title":"ReRoPE: Repurposing RoPE for Relative Camera Control","display_name":"ReRoPE: Repurposing RoPE for Relative Camera Control","publication_year":2026,"publication_date":"2026-02-08","ids":{"openalex":"https://openalex.org/W7128521135","doi":"https://doi.org/10.48550/arxiv.2602.08068"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.08068","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125483641","display_name":"Chunyang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Chunyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125525331","display_name":"Yuanbo Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yuanbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125483758","display_name":"Jiahao Shao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Jiahao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125584638","display_name":"Hongyu Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Hongyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110696266","display_name":"Katja Schwarz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwarz, Katja","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125569554","display_name":"Yiyi Liao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Yiyi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5125483641"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.707099974155426,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.707099974155426,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.10040000081062317,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.02800000086426735,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/camera-auto-calibration","display_name":"Camera auto-calibration","score":0.39899998903274536},{"id":"https://openalex.org/keywords/video-camera","display_name":"Video camera","score":0.39469999074935913},{"id":"https://openalex.org/keywords/smart-camera","display_name":"Smart camera","score":0.38920000195503235},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.37929999828338623},{"id":"https://openalex.org/keywords/repurposing","display_name":"Repurposing","score":0.3788999915122986},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.3529999852180481},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.3456999957561493},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.314300000667572}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7398999929428101},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6535000205039978},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6492999792098999},{"id":"https://openalex.org/C94816000","wikidata":"https://www.wikidata.org/wiki/Q5026006","display_name":"Camera auto-calibration","level":3,"score":0.39899998903274536},{"id":"https://openalex.org/C2778852477","wikidata":"https://www.wikidata.org/wiki/Q313614","display_name":"Video camera","level":2,"score":0.39469999074935913},{"id":"https://openalex.org/C161334170","wikidata":"https://www.wikidata.org/wiki/Q1428778","display_name":"Smart camera","level":2,"score":0.38920000195503235},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.37929999828338623},{"id":"https://openalex.org/C519536355","wikidata":"https://www.wikidata.org/wiki/Q21021151","display_name":"Repurposing","level":2,"score":0.3788999915122986},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.3529999852180481},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.3456999957561493},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.31310001015663147},{"id":"https://openalex.org/C2778022956","wikidata":"https://www.wikidata.org/wiki/Q192234","display_name":"Camera lens","level":3,"score":0.3059999942779541},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C2779705975","wikidata":"https://www.wikidata.org/wiki/Q62927","display_name":"Digital camera","level":2,"score":0.29330000281333923},{"id":"https://openalex.org/C2776035091","wikidata":"https://www.wikidata.org/wiki/Q7928819","display_name":"Viewpoints","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.28029999136924744},{"id":"https://openalex.org/C162269090","wikidata":"https://www.wikidata.org/wiki/Q1156047","display_name":"Rope","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C119657128","wikidata":"https://www.wikidata.org/wiki/Q11633","display_name":"Photography","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C151211776","wikidata":"https://www.wikidata.org/wiki/Q2778015","display_name":"Video capture","level":3,"score":0.2639999985694885}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.08068","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.08068","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.08068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.08068","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"generation":[1,100],"with":[2],"controllable":[3],"camera":[4,26,52,90,131,163],"viewpoints":[5],"is":[6,104],"essential":[7],"for":[8,186],"applications":[9],"such":[10],"as":[11],"interactive":[12],"content":[13],"creation,":[14],"gaming,":[15],"and":[16,47,156,166],"simulation.":[17],"Existing":[18],"methods":[19],"typically":[20],"adapt":[21],"pre-trained":[22,68,93,145],"video":[23,69,94,181],"models":[24,71,96,116],"using":[25],"poses":[27],"relative":[28,51,89,130],"to":[29,44],"a":[30,61,84,175],"fixed":[31],"reference,":[32],"e.g.,":[33],"the":[34,107,124],"first":[35],"frame.":[36],"However,":[37],"these":[38,135],"encodings":[39],"lack":[40],"shift-invariance,":[41],"often":[42],"leading":[43],"poor":[45],"generalization":[46],"accumulated":[48],"drift.":[49],"While":[50],"pose":[53,132],"embeddings":[54],"defined":[55],"between":[56],"arbitrary":[57],"view":[58],"pairs":[59],"offer":[60],"more":[62,187],"robust":[63],"alternative,":[64],"integrating":[65],"them":[66],"into":[67,92,134],"diffusion":[70,95],"without":[72,97],"prohibitive":[73],"training":[74],"costs":[75],"or":[76],"architectural":[77],"changes":[78],"remains":[79],"challenging.":[80],"We":[81,148],"introduce":[82],"ReRoPE,":[83],"plug-and-play":[85],"framework":[86],"that":[87,109,172],"incorporates":[88],"information":[91,133],"compromising":[98],"their":[99,118],"capability.":[101],"Our":[102,169],"approach":[103],"based":[105],"on":[106,152],"insight":[108],"Rotary":[110],"Positional":[111],"Embeddings":[112],"(RoPE)":[113],"in":[114,123,160],"existing":[115],"underutilize":[117],"full":[119],"spectral":[120],"bandwidth,":[121],"particularly":[122],"low-frequency":[125],"components.":[126],"By":[127],"seamlessly":[128],"injecting":[129],"underutilized":[136],"bands,":[137],"ReRoPE":[138,173],"achieves":[139],"precise":[140],"control":[141,164],"while":[142],"preserving":[143],"strong":[144],"generative":[146],"priors.":[147],"evaluate":[149],"our":[150],"method":[151],"both":[153],"image-to-video":[154],"(I2V)":[155],"video-to-video":[157],"(V2V)":[158],"tasks":[159],"terms":[161],"of":[162],"accuracy":[165],"visual":[167],"fidelity.":[168],"results":[170],"demonstrate":[171],"offers":[174],"training-efficient":[176],"path":[177],"toward":[178],"controllable,":[179],"high-fidelity":[180],"generation.":[182],"See":[183],"project":[184],"page":[185],"results:":[188],"https://sisyphe-lee.github.io/ReRoPE/":[189]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-11T00:00:00"}
