{"id":"https://openalex.org/W7140159933","doi":"https://doi.org/10.48550/arxiv.2603.21785","title":"Image-Conditioned Adaptive Parameter Tuning for Visual Odometry Frontends","display_name":"Image-Conditioned Adaptive Parameter Tuning for Visual Odometry Frontends","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140159933","doi":"https://doi.org/10.48550/arxiv.2603.21785"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21785","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21785","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21785","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Nascivera, Simone","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Nascivera, Simone","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Bauersfeld, Leonard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bauersfeld, Leonard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Delaune, Jeff","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Delaune, Jeff","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Scaramuzza, Davide","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scaramuzza, Davide","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.8553000092506409,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.8553000092506409,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.09200000017881393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.008799999952316284,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6371999979019165},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6044999957084656},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5227000117301941},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.4925999939441681},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.47189998626708984},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4555000066757202},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4431999921798706},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.40689998865127563},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4020000100135803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7401000261306763},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6452000141143799},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6371999979019165},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6044999957084656},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5357999801635742},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5227000117301941},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.4925999939441681},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.47189998626708984},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4431999921798706},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.40689998865127563},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4020000100135803},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.39590001106262207},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.3871999979019165},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C5799516","wikidata":"https://www.wikidata.org/wiki/Q4110915","display_name":"Visual odometry","level":3,"score":0.3693999946117401},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3472000062465668},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.33309999108314514},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.3208000063896179},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C2987395694","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Feature tracking","level":3,"score":0.3073999881744385},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3066999912261963},{"id":"https://openalex.org/C49441653","wikidata":"https://www.wikidata.org/wiki/Q2014717","display_name":"Odometry","level":4,"score":0.26910001039505005},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2653000056743622},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21785","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21785","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21785","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21785","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6014755964279175,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Resource-constrained":[0],"autonomous":[1],"robots":[2],"rely":[3,145],"on":[4,32,147,165],"sparse":[5],"direct":[6],"and":[7,21,39,65,111,123,134,157,167,175],"semi-direct":[8],"visual-(inertial)-odometry":[9],"(VO)":[10],"pipelines,":[11],"as":[12,59,106],"they":[13],"provide":[14],"a":[15,107,113,129,135],"favorable":[16],"tradeoff":[17],"between":[18],"accuracy,":[19],"robustness,":[20],"computational":[22,178],"cost.":[23],"However,":[24],"the":[25,77,92,95,103,154],"performance":[26,71],"of":[27,86],"most":[28],"systems":[29],"depends":[30],"critically":[31],"hand-tuned":[33],"hyperparameters":[34],"governing":[35],"feature":[36,121,173],"detection,":[37],"tracking,":[38],"outlier":[40],"rejection.":[41],"These":[42],"parameters":[43,160],"are":[44],"typically":[45],"fixed":[46],"during":[47,138],"deployment,":[48],"even":[49],"though":[50],"their":[51],"optimal":[52],"values":[53],"vary":[54],"with":[55],"scene":[56],"characteristics":[57],"such":[58],"texture":[60],"density,":[61],"illumination,":[62],"motion":[63],"blur,":[64],"sensor":[66],"noise,":[67],"leading":[68],"to":[69,101,120],"brittle":[70],"in":[72,183],"real-world":[73],"environments.":[74],"We":[75],"propose":[76],"first":[78],"image-conditioned":[79],"reinforcement":[80],"learning":[81],"framework":[82],"for":[83],"online":[84],"tuning":[85],"VO":[87,149],"frontend":[88,104],"parameters,":[89],"effectively":[90],"embedding":[91],"expert":[93],"into":[94],"system.":[96],"Our":[97],"key":[98],"idea":[99],"is":[100],"formulate":[102],"configuration":[105],"sequential":[108],"decision-making":[109],"problem":[110],"learn":[112],"policy":[114,127],"that":[115,144],"directly":[116],"maps":[117],"visual":[118],"input":[119],"detection":[122],"tracking":[124,162],"parameters.":[125],"The":[126],"uses":[128],"lightweight":[130],"texture-aware":[131],"CNN":[132],"encoder":[133],"privileged":[136],"critic":[137],"training.":[139],"Unlike":[140],"prior":[141],"RL-based":[142],"approaches":[143],"solely":[146],"internal":[148],"statistics,":[150],"our":[151],"method":[152],"observes":[153],"image":[155],"content":[156],"proactively":[158],"adapts":[159],"before":[161],"degrades.":[163],"Experiments":[164],"TartanAirV2":[166],"TUM":[168],"RGB-D":[169],"show":[170],"3x":[171,176],"longer":[172],"tracks":[174],"lower":[177],"cost,":[179],"despite":[180],"training":[181],"entirely":[182],"simulation.":[184]},"counts_by_year":[],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2026-03-25T00:00:00"}
