{"id":"https://openalex.org/W7162466477","doi":"https://doi.org/10.48550/arxiv.2605.25308","title":"Stabilizing Streaming Video Geometry via Dynamic Feature Normalization","display_name":"Stabilizing Streaming Video Geometry via Dynamic Feature Normalization","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162466477","doi":"https://doi.org/10.48550/arxiv.2605.25308"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.25308","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25308","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.25308","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137052613","display_name":"Xiaoyang Lyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lyu, Xiaoyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137061873","display_name":"Muxin Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Muxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137013648","display_name":"Xiaoshan Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xiaoshan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137029000","display_name":"Ruicheng Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ruicheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136995426","display_name":"Yi-Hua Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Yi-Hua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137029584","display_name":"Yang-Tian Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Yang-Tian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137001123","display_name":"Shaoshuai Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Shaoshuai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137004931","display_name":"Xiaojuan Qi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Xiaojuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.7226999998092651,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.7226999998092651,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.11079999804496765,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.05009999871253967,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.6280999779701233},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5853999853134155},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.5516999959945679},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5335999727249146},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40369999408721924},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3693000078201294},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.3594000041484833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6503000259399414},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.6280999779701233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6054999828338623},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5853999853134155},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.5516999959945679},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5335999727249146},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5123999714851379},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40369999408721924},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3693000078201294},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.35120001435279846},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3231000006198883},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.28299999237060547},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.27869999408721924},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C158843486","wikidata":"https://www.wikidata.org/wiki/Q2137810","display_name":"Complex geometry","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.26820001006126404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.25308","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25308","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.25308","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25308","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Consistent":[0],"3D":[1],"geometry":[2,25,99,107],"estimation":[3],"from":[4],"streaming":[5,110,160],"RGB":[6],"input":[7],"is":[8],"crucial":[9],"for":[10,109],"real-world":[11],"applications":[12],"such":[13,145],"as":[14,146],"autonomous":[15],"driving,":[16],"embodied":[17],"AI,":[18],"and":[19,64,72,91,149,152,166],"large-scale":[20],"reconstruction.":[21],"While":[22],"modern":[23],"monocular":[24,106],"foundation":[26],"models":[27,108],"achieve":[28],"strong":[29],"single-image":[30,131],"accuracy,":[31],"they":[32],"exhibit":[33],"severe":[34],"temporal":[35,127,143,155],"inconsistency":[36],"on":[37,75],"continuous":[38],"input,":[39],"notably":[40],"dominated":[41],"by":[42,111,162],"scale--shift":[43],"drifting.":[44],"Through":[45],"targeted":[46],"empirical":[47],"analysis,":[48],"we":[49,78],"trace":[50],"this":[51,76],"instability":[52],"to":[53,96,164],"its":[54],"root":[55],"cause:":[56],"fluctuations":[57],"in":[58],"latent":[59],"feature":[60,94],"statistics,":[61],"whose":[62],"mean":[63],"variance":[65],"directly":[66],"determine":[67],"the":[68,122],"predicted":[69],"depth's":[70],"scale":[71],"shift.":[73],"Building":[74],"insight,":[77],"introduce":[79],"Dynamic":[80],"Feature":[81],"Normalization":[82],"(DyFN),":[83],"a":[84,115],"lightweight,":[85],"causal":[86],"recurrent":[87],"module":[88],"that":[89,139],"dynamically":[90],"robustly":[92],"modulates":[93],"statistics":[95],"maintain":[97],"stable":[98],"over":[100,158],"time.":[101],"We":[102],"adapt":[103],"powerful":[104],"pretrained":[105],"finetuning":[112],"only":[113],"DyFN,":[114],"mere":[116],"2\\%":[117],"additional":[118],"parameters,":[119],"while":[120],"keeping":[121],"backbone":[123],"frozen,":[124],"thereby":[125],"achieving":[126],"consistency":[128],"without":[129],"compromising":[130],"accuracy.":[132],"Extensive":[133],"experiments":[134],"across":[135],"four":[136],"benchmarks":[137],"show":[138],"DyFN":[140],"effectively":[141],"eliminates":[142],"artifacts":[144],"disjointed":[147],"layering":[148],"positional":[150],"jitter,":[151],"achieves":[153],"state-of-the-art":[154],"stability,":[156],"improving":[157],"prior":[159],"methods":[161],"up":[163],"14\\%":[165],"even":[167],"outperforming":[168],"heavier":[169],"non-causal":[170],"video":[171],"baselines.":[172],"Project":[173],"Page:":[174],"https://shawlyu.github.io/DyFN":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
