{"id":"https://openalex.org/W7164809715","doi":"https://doi.org/10.1145/3805622.3810594","title":"Geometry-Guided Depth Correction for Metric Relative Pose Estimation","display_name":"Geometry-Guided Depth Correction for Metric Relative Pose Estimation","publication_year":2026,"publication_date":"2026-06-15","ids":{"openalex":"https://openalex.org/W7164809715","doi":"https://doi.org/10.1145/3805622.3810594"},"language":null,"primary_location":{"id":"doi:10.1145/3805622.3810594","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810594","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3805622.3810594","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5138629337","display_name":"Shibin Xie","orcid":"https://orcid.org/0009-0006-8888-151X"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shibin Xie","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0006-8888-151X","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5138635304","display_name":"Hao Yin","orcid":"https://orcid.org/0009-0009-7609-5089"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Yin","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0009-7609-5089","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044656816","display_name":"S Y Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuting Wang","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0009-1206-4048","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5138656601","display_name":"Xiaokang Fang","orcid":"https://orcid.org/0009-0006-5769-0104"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaokang Fang","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0006-5769-0104","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042518722","display_name":"Liang Jin","orcid":"https://orcid.org/0000-0002-7552-7849"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Jin","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0008-5756-9114","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5138642318","display_name":"Haotian Liu","orcid":"https://orcid.org/0009-0005-9733-1563"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haotian Liu","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0005-9733-1563","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100611270","display_name":"Yanting Zhang","orcid":"https://orcid.org/0000-0001-6317-1956"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanting Zhang","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-6317-1956","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038044282","display_name":"Shen Cai","orcid":"https://orcid.org/0000-0001-5217-3155"},"institutions":[{"id":"https://openalex.org/I181326427","display_name":"Donghua University","ror":"https://ror.org/035psfh38","country_code":"CN","type":"education","lineage":["https://openalex.org/I181326427"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shen Cai","raw_affiliation_strings":["Donghua University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-5217-3155","affiliations":[{"raw_affiliation_string":"Donghua University, Shanghai, China","institution_ids":["https://openalex.org/I181326427"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93407986,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1251","last_page":"1259"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.766700029373169,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.766700029373169,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.10790000110864639,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.03189999982714653,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.682200014591217},{"id":"https://openalex.org/keywords/ransac","display_name":"RANSAC","score":0.673799991607666},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6381999850273132},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5817000269889832},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.48489999771118164},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.46889999508857727},{"id":"https://openalex.org/keywords/differentiable-function","display_name":"Differentiable function","score":0.46160000562667847},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.38179999589920044}],"concepts":[{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.682200014591217},{"id":"https://openalex.org/C114744707","wikidata":"https://www.wikidata.org/wiki/Q218533","display_name":"RANSAC","level":3,"score":0.673799991607666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6509000062942505},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6381999850273132},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5817000269889832},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5709999799728394},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48980000615119934},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.48489999771118164},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.46889999508857727},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.46160000562667847},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.38179999589920044},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3817000091075897},{"id":"https://openalex.org/C23379248","wikidata":"https://www.wikidata.org/wiki/Q200904","display_name":"Epipolar geometry","level":3,"score":0.34209999442100525},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3188999891281128},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.3068000078201294},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2964000105857849},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.28679999709129333},{"id":"https://openalex.org/C179458375","wikidata":"https://www.wikidata.org/wiki/Q1020763","display_name":"Bundle adjustment","level":3,"score":0.2768999934196472},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2678999900817871},{"id":"https://openalex.org/C2986492983","wikidata":"https://www.wikidata.org/wiki/Q861092","display_name":"Image matching","level":3,"score":0.2624000012874603},{"id":"https://openalex.org/C3019007443","wikidata":"https://www.wikidata.org/wiki/Q568742","display_name":"3d model","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C158829959","wikidata":"https://www.wikidata.org/wiki/Q1640606","display_name":"Monocular vision","level":2,"score":0.2533999979496002},{"id":"https://openalex.org/C3020402766","wikidata":"https://www.wikidata.org/wiki/Q104376712","display_name":"Prior information","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3805622.3810594","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810594","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3805622.3810594","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810594","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2200124539","https://openalex.org/W2620629206","https://openalex.org/W2905260191","https://openalex.org/W2955639361","https://openalex.org/W3034275286","https://openalex.org/W3138516171","https://openalex.org/W4390872507","https://openalex.org/W4402771002","https://openalex.org/W4413145529","https://openalex.org/W4413155527","https://openalex.org/W4413156343","https://openalex.org/W7160090332"],"related_works":[],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"Monocular":[3],"Depth":[4],"Estimation":[5],"(MDE)":[6],"has":[7],"evolved":[8],"from":[9,80],"predicting":[10],"affine-invariant":[11],"relative":[12,43,59,113],"depth":[13,25,54,88,98],"to":[14,69,91,109],"estimating":[15],"metric-scale":[16,58],"(absolute)":[17],"depth.":[18],"However,":[19],"local":[20,87],"geometric":[21,93],"inconsistencies":[22,29],"in":[23,39],"single-view":[24],"maps":[26],"and":[27,42,76,121,130],"scale":[28],"across":[30,132],"different":[31],"views":[32],"still":[33],"severely":[34],"hinder":[35],"their":[36],"practical":[37],"application":[38],"3D":[40],"matching":[41],"pose":[44,60,114],"estimation.":[45,61],"To":[46],"address":[47],"these":[48],"challenges,":[49],"we":[50],"propose":[51],"a":[52,86,105],"geometry-guided":[53],"correction":[55],"framework":[56,108],"for":[57],"Our":[62],"approach":[63],"first":[64],"leverages":[65],"pre-trained":[66],"foundation":[67],"models":[68],"extract":[70],"initial":[71],"metric":[72],"depth,":[73],"semi-dense":[74],"correspondences,":[75],"high-dimensional":[77],"semantic":[78],"features":[79],"dual-view":[81],"images.":[82],"We":[83],"then":[84],"introduce":[85],"refinement":[89],"module":[90],"correct":[92],"deviations.":[94],"Finally,":[95],"the":[96,112],"corrected":[97],"of":[99],"stereo-matched":[100],"pairs":[101],"is":[102],"integrated":[103],"into":[104],"differentiable":[106],"RANSAC":[107],"jointly":[110],"optimize":[111],"with":[115],"consistent":[116],"scale.":[117],"Experiments":[118],"on":[119],"ScanNet":[120],"7-Scenes":[122],"demonstrate":[123],"that":[124],"our":[125],"method":[126],"achieves":[127],"superior":[128],"performance":[129],"robustness":[131],"various":[133],"challenging":[134],"scenarios.":[135]},"counts_by_year":[],"updated_date":"2026-06-16T07:37:23.134862","created_date":"2026-06-16T00:00:00"}
