{"id":"https://openalex.org/W7134896412","doi":"https://doi.org/10.48550/arxiv.2603.09819","title":"ConfCtrl: Enabling Precise Camera Control in Video Diffusion via Confidence-Aware Interpolation","display_name":"ConfCtrl: Enabling Precise Camera Control in Video Diffusion via Confidence-Aware Interpolation","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134896412","doi":"https://doi.org/10.48550/arxiv.2603.09819"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09819","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09819","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09819","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yang, Liudi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Liudi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049254859","display_name":"George Eskandar","orcid":"https://orcid.org/0000-0002-8099-8717"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eskandar, George","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052009653","display_name":"Fengyi Shen","orcid":"https://orcid.org/0000-0001-7621-9779"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Fengyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128736995","display_name":"Mohammad Altillawi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Altillawi, Mohammad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128798439","display_name":"Yang Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128728375","display_name":"Chi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128734247","display_name":"Ziyuan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ziyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128774135","display_name":"Abhinav Valada","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Valada, Abhinav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.6814000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.6814000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.14740000665187836,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.08829999715089798,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.6769999861717224},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5861999988555908},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.5297999978065491},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.47440001368522644},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4578999876976013},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.4562999904155731},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.453900009393692},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.40779998898506165}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7416999936103821},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7142999768257141},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.6769999861717224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6662999987602234},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5861999988555908},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.5297999978065491},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4578999876976013},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.4562999904155731},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.453900009393692},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.40779998898506165},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.3264999985694885},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.31610000133514404},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.311599999666214},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.3082999885082245},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.303600013256073},{"id":"https://openalex.org/C141379421","wikidata":"https://www.wikidata.org/wiki/Q6094427","display_name":"Iterative reconstruction","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.2856000065803528},{"id":"https://openalex.org/C2777774050","wikidata":"https://www.wikidata.org/wiki/Q16945110","display_name":"Control point","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.258899986743927}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09819","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09819","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09819","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09819","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0],"address":[1,49],"the":[2,21,75,89,100,123],"challenge":[3],"of":[4],"novel":[5,151],"view":[6],"synthesis":[7],"from":[8,33,45],"only":[9],"two":[10],"input":[11],"images":[12],"under":[13,157],"large":[14,158],"viewpoint":[15,159],"changes.":[16,160],"Existing":[17],"regression-based":[18],"methods":[19],"lack":[20],"capacity":[22],"to":[23,37,64,113,125],"reconstruct":[24],"unseen":[25,71],"regions,":[26,133],"while":[27,69,130],"camera-guided":[28],"diffusion":[29,62,76],"models":[30,63],"often":[31],"deviate":[32],"intended":[34],"trajectories":[35],"due":[36],"noisy":[38,106,118],"point":[39,83,102],"cloud":[40,84,103],"projections":[41,129],"or":[42],"insufficient":[43],"conditioning":[44,90],"camera":[46,67],"poses.":[47],"To":[48],"these":[50],"issues,":[51],"we":[52],"propose":[53],"ConfCtrl,":[54],"a":[55,80,95,105],"confidence-aware":[56],"video":[57],"interpolation":[58],"framework":[59],"that":[60,143],"enables":[61],"follow":[65],"prescribed":[66],"poses":[68],"completing":[70],"regions.":[72],"ConfCtrl":[73,144],"initializes":[74],"process":[77],"by":[78],"combining":[79],"confidence-weighted":[81],"projected":[82,101],"latent":[85],"with":[86,117],"noise":[87],"as":[88,104],"input.":[91],"It":[92],"then":[93],"applies":[94],"Kalman-inspired":[96],"predict-update":[97],"mechanism,":[98],"treating":[99],"measurement":[107],"and":[108,148],"using":[109],"learned":[110],"residual":[111],"corrections":[112],"balance":[114],"pose-driven":[115],"predictions":[116],"geometric":[119],"observations.":[120],"This":[121],"allows":[122],"model":[124],"rely":[126],"on":[127,139],"reliable":[128],"down-weighting":[131],"uncertain":[132],"yielding":[134],"stable,":[135],"geometry-aware":[136],"generation.":[137],"Experiments":[138],"multiple":[140],"datasets":[141],"show":[142],"produces":[145],"geometrically":[146],"consistent":[147],"visually":[149],"plausible":[150],"views,":[152],"effectively":[153],"reconstructing":[154],"occluded":[155],"regions":[156]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-03-12T00:00:00"}
