{"id":"https://openalex.org/W4406753856","doi":"https://doi.org/10.1109/tcsvt.2025.3533256","title":"KPDepth-VO: Self-Supervised Learning of Scale-Consistent Visual Odometry and Depth With Keypoint Features From Monocular Video","display_name":"KPDepth-VO: Self-Supervised Learning of Scale-Consistent Visual Odometry and Depth With Keypoint Features From Monocular Video","publication_year":2025,"publication_date":"2025-01-23","ids":{"openalex":"https://openalex.org/W4406753856","doi":"https://doi.org/10.1109/tcsvt.2025.3533256"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3533256","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3533256","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048024916","display_name":"Changhao Wang","orcid":"https://orcid.org/0000-0002-2142-0632"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changhao Wang","raw_affiliation_strings":["Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China"],"raw_orcid":"https://orcid.org/0000-0002-2142-0632","affiliations":[{"raw_affiliation_string":"Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087863930","display_name":"Guanwen Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanwen Zhang","raw_affiliation_strings":["Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China"],"raw_orcid":"https://orcid.org/0000-0001-6036-4074","affiliations":[{"raw_affiliation_string":"Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004862851","display_name":"Zhengyun Cheng","orcid":"https://orcid.org/0000-0002-1003-4381"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengyun Cheng","raw_affiliation_strings":["Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China"],"raw_orcid":"https://orcid.org/0000-0002-1003-4381","affiliations":[{"raw_affiliation_string":"Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000288828","display_name":"Wei Zhou","orcid":"https://orcid.org/0000-0001-9715-6957"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhou","raw_affiliation_strings":["Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China"],"raw_orcid":"https://orcid.org/0000-0001-9715-6957","affiliations":[{"raw_affiliation_string":"Visual Intelligent Processing Laboratory, School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"School of Electronics and Information, Visual Intelligent Processing Laboratory, Northwestern Polytechnical University, Xi&#x2019;an, Shannxi, P.R.China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.5446,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.96453712,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"35","issue":"6","first_page":"5762","last_page":"5775"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.8062934875488281},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.7699763774871826},{"id":"https://openalex.org/keywords/visual-odometry","display_name":"Visual odometry","score":0.7404592037200928},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6467404365539551},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6118230223655701},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5597639083862305},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4870014786720276},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.07374927401542664},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.07051661610603333},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.0633837878704071}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8062934875488281},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.7699763774871826},{"id":"https://openalex.org/C5799516","wikidata":"https://www.wikidata.org/wiki/Q4110915","display_name":"Visual odometry","level":3,"score":0.7404592037200928},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6467404365539551},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6118230223655701},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5597639083862305},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4870014786720276},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.07374927401542664},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.07051661610603333},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0633837878704071}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3533256","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3533256","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2298402825","display_name":null,"funder_award_id":"2018AAA0102803","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2761896105","display_name":null,"funder_award_id":"2018ZE53052","funder_id":"https://openalex.org/F4320336567","funder_display_name":"Natural Science Basic Research Program of Shaanxi Province"},{"id":"https://openalex.org/G3772749610","display_name":null,"funder_award_id":"61602383","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4712350512","display_name":null,"funder_award_id":"2021JM- 074","funder_id":"https://openalex.org/F4320336567","funder_display_name":"Natural Science Basic Research Program of Shaanxi Province"},{"id":"https://openalex.org/G4791232520","display_name":"\u9762\u5411\u8d85\u9ad8\u6e05\u89c6\u9891\u7f16\u89e3\u7801\u7684\u9ad8\u6548\u5b58\u50a8\u6280\u672f\u7814\u7a76","funder_award_id":"61772424","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7165284919","display_name":null,"funder_award_id":"2018AAA0102801","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G839588479","display_name":null,"funder_award_id":"61702418","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8704831294","display_name":null,"funder_award_id":"2021JM-074","funder_id":"https://openalex.org/F4320336567","funder_display_name":"Natural Science Basic Research Program of Shaanxi Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336567","display_name":"Natural Science Basic Research Program of Shaanxi Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W612478963","https://openalex.org/W1612997784","https://openalex.org/W1861492603","https://openalex.org/W1970504153","https://openalex.org/W1979931042","https://openalex.org/W2033819227","https://openalex.org/W2085261163","https://openalex.org/W2102481828","https://openalex.org/W2117539524","https://openalex.org/W2133665775","https://openalex.org/W2150066425","https://openalex.org/W2194775991","https://openalex.org/W2474281075","https://openalex.org/W2520707372","https://openalex.org/W2535547924","https://openalex.org/W2558027072","https://openalex.org/W2564632156","https://openalex.org/W2609883120","https://openalex.org/W2798405286","https://openalex.org/W2890949887","https://openalex.org/W2895192073","https://openalex.org/W2962816904","https://openalex.org/W2963488291","https://openalex.org/W2963583471","https://openalex.org/W2967059695","https://openalex.org/W2968288611","https://openalex.org/W2981732213","https://openalex.org/W2985775862","https://openalex.org/W2990946490","https://openalex.org/W2995569955","https://openalex.org/W3034364596","https://openalex.org/W3034475171","https://openalex.org/W3035056458","https://openalex.org/W3091687063","https://openalex.org/W3128629208","https://openalex.org/W3138516171","https://openalex.org/W3145609993","https://openalex.org/W3162552392","https://openalex.org/W3173274332","https://openalex.org/W3174211490","https://openalex.org/W3180341139","https://openalex.org/W3200732573","https://openalex.org/W3204559841","https://openalex.org/W3206296944","https://openalex.org/W3211993773","https://openalex.org/W4214893857","https://openalex.org/W4214925515","https://openalex.org/W4285130569","https://openalex.org/W4295934562","https://openalex.org/W4312725059","https://openalex.org/W4312856322","https://openalex.org/W4320036904","https://openalex.org/W4321504701","https://openalex.org/W4361997638","https://openalex.org/W4381886216","https://openalex.org/W4385245566","https://openalex.org/W4386076019","https://openalex.org/W4387831730","https://openalex.org/W4393864956","https://openalex.org/W4399939213","https://openalex.org/W4401414068","https://openalex.org/W6631190155","https://openalex.org/W6685261749","https://openalex.org/W6735443497","https://openalex.org/W6767088534"],"related_works":["https://openalex.org/W3006563365","https://openalex.org/W4386394365","https://openalex.org/W2789602789","https://openalex.org/W2954249689","https://openalex.org/W2626414811","https://openalex.org/W4313484789","https://openalex.org/W2001736731","https://openalex.org/W2913604885","https://openalex.org/W4302306787","https://openalex.org/W4300939778"],"abstract_inverted_index":{"Monocular":[0],"visual":[1],"odometry":[2],"(VO)":[3],"is":[4],"crucial":[5],"for":[6,68,92,119],"the":[7,14,54,69,76,127,133,159],"application":[8],"of":[9],"various":[10],"autonomous":[11],"systems.":[12],"However,":[13],"inherent":[15],"scale":[16,85,94],"ambiguity":[17],"issue":[18],"in":[19,26,75,126],"monocular":[20,36,46,149],"methods":[21],"greatly":[22],"limits":[23],"their":[24],"performance":[25,154,169],"pose":[27,44,124],"estimation.":[28],"In":[29],"this":[30],"paper,":[31],"we":[32,58,97],"propose":[33,98],"a":[34,60,99,106],"hybrid":[35],"VO":[37],"system":[38,143,164],"named":[39],"KPDepth-VO,":[40],"which":[41],"solves":[42],"camera":[43],"from":[45,148],"video":[47],"based":[48],"on":[49,132,170],"sparse":[50],"keypoints.":[51],"To":[52],"estimate":[53],"scale-consistent":[55,146],"relative":[56],"pose,":[57],"present":[59],"novel":[61,100],"photometric-sensitive":[62],"depth":[63,70,90,160,167,172],"uncertainty":[64,71,91],"model":[65],"that":[66,88,109,141],"accounts":[67],"introduced":[72],"by":[73],"limitations":[74],"photometric":[77],"error":[78],"constraint.":[79],"We":[80],"also":[81],"introduce":[82],"an":[83],"uncertainty-aware":[84],"recovery":[86],"strategy":[87],"incorporates":[89],"reliable":[93],"alignment.":[95],"Additionally,":[96],"difference":[101],"attention":[102],"mechanism":[103],"to":[104],"construct":[105],"point":[107],"filter":[108],"effectively":[110],"filters":[111],"out":[112],"less":[113],"distinctive":[114],"points,":[115],"ensuring":[116],"high-quality":[117],"matches":[118],"more":[120],"accurate":[121],"and":[122,136,151],"efficient":[123],"estimation":[125,168],"proposed":[128],"system.":[129],"Experimental":[130],"results":[131],"KITTI":[134,171],"dataset":[135,139],"Oxford":[137],"Robotcar":[138],"demonstrate":[140],"our":[142,163],"can":[144],"predict":[145],"trajectories":[147],"videos":[150],"achieve":[152],"state-of-the-art":[153],"among":[155],"similar":[156],"methods.":[157],"Meanwhile,":[158],"network":[161],"within":[162],"achieves":[165],"competitive":[166],"benchmark.":[173]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
