{"id":"https://openalex.org/W4379806231","doi":"https://doi.org/10.1145/3591106.3592264","title":"Towards Practical Consistent Video Depth Estimation","display_name":"Towards Practical Consistent Video Depth Estimation","publication_year":2023,"publication_date":"2023-06-08","ids":{"openalex":"https://openalex.org/W4379806231","doi":"https://doi.org/10.1145/3591106.3592264"},"language":"en","primary_location":{"id":"doi:10.1145/3591106.3592264","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592264","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592264","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592264","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081639449","display_name":"Pengzhi Li","orcid":"https://orcid.org/0009-0005-4763-4320"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pengzhi Li","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":"https://orcid.org/0009-0005-4763-4320","affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013886309","display_name":"Yikang Ding","orcid":"https://orcid.org/0000-0001-6916-9371"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yikang Ding","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":"https://orcid.org/0000-0001-6916-9371","affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102765423","display_name":"Linge Li","orcid":"https://orcid.org/0009-0008-3409-1875"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linge Li","raw_affiliation_strings":["Huawei, China"],"raw_orcid":"https://orcid.org/0009-0008-3409-1875","affiliations":[{"raw_affiliation_string":"Huawei, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102783736","display_name":"Jingwei Guan","orcid":"https://orcid.org/0009-0009-2302-2986"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingwei Guan","raw_affiliation_strings":["Huawei, China"],"raw_orcid":"https://orcid.org/0009-0009-2302-2986","affiliations":[{"raw_affiliation_string":"Huawei, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100765837","display_name":"Zhiheng Li","orcid":"https://orcid.org/0000-0002-1523-1114"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiheng Li","raw_affiliation_strings":["Tsinghua University, China"],"raw_orcid":"https://orcid.org/0000-0002-1523-1114","affiliations":[{"raw_affiliation_string":"Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5081639449"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.3532,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.57919397,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"388","last_page":"397"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8334817886352539},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6541285514831543},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6232272982597351},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.5597742199897766},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5485712289810181},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5085035562515259},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4706375300884247},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.43385428190231323},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.31116294860839844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8334817886352539},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6541285514831543},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6232272982597351},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.5597742199897766},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5485712289810181},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5085035562515259},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4706375300884247},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.43385428190231323},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31116294860839844},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3591106.3592264","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592264","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592264","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3591106.3592264","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3591106.3592264","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3591106.3592264","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 ACM International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4379806231.pdf","grobid_xml":"https://content.openalex.org/works/W4379806231.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W125693051","https://openalex.org/W1513100184","https://openalex.org/W2021851106","https://openalex.org/W2040369854","https://openalex.org/W2117228865","https://openalex.org/W2150066425","https://openalex.org/W2300779272","https://openalex.org/W2470139095","https://openalex.org/W2471962767","https://openalex.org/W2520707372","https://openalex.org/W2609883120","https://openalex.org/W2798927139","https://openalex.org/W2886787375","https://openalex.org/W2887825894","https://openalex.org/W2890949887","https://openalex.org/W2942368658","https://openalex.org/W2945020349","https://openalex.org/W2956939277","https://openalex.org/W2962927978","https://openalex.org/W2963412495","https://openalex.org/W2963591054","https://openalex.org/W2963654727","https://openalex.org/W2963760790","https://openalex.org/W2964254721","https://openalex.org/W2964968086","https://openalex.org/W2982014906","https://openalex.org/W2982336692","https://openalex.org/W2985775862","https://openalex.org/W2996880115","https://openalex.org/W3035563424","https://openalex.org/W3048510980","https://openalex.org/W3060975791","https://openalex.org/W3081167590","https://openalex.org/W3094190932","https://openalex.org/W3102638728","https://openalex.org/W3111114371","https://openalex.org/W3174458495","https://openalex.org/W3174541782","https://openalex.org/W3175682855","https://openalex.org/W3182318349","https://openalex.org/W3182700213","https://openalex.org/W3183537987","https://openalex.org/W3208147236","https://openalex.org/W3215023725","https://openalex.org/W4200420145","https://openalex.org/W4214520160","https://openalex.org/W4289550868","https://openalex.org/W4312468718","https://openalex.org/W4313171699","https://openalex.org/W4313177683"],"related_works":["https://openalex.org/W200819717","https://openalex.org/W2032269556","https://openalex.org/W1991834176","https://openalex.org/W4386083130","https://openalex.org/W2944448661","https://openalex.org/W2064421702","https://openalex.org/W4253756925","https://openalex.org/W2030154815","https://openalex.org/W2051121715","https://openalex.org/W1929254672"],"abstract_inverted_index":{"Monocular":[0],"depth":[1,24,88,102,112,134,179,191],"estimation":[2,113,180,192],"algorithms":[3],"aim":[4],"to":[5,21,66,92,109,125,144,173],"explore":[6],"the":[7,34,38,83,97,127,146,161,168,175,199],"possible":[8],"links":[9],"between":[10],"2D":[11],"and":[12,33,50,70,86,99,115,189],"3D":[13],"data,":[14],"but":[15],"challenges":[16,69],"remain":[17],"for":[18,54,117,181],"existing":[19],"methods":[20,45],"predict":[22],"consistent":[23,132],"from":[25,96,151],"a":[26,62,76,130,152],"casual":[27,182],"video.":[28],"Relying":[29],"on":[30,75,156,186],"camera":[31],"poses":[32],"optical":[35],"flow":[36],"in":[37,47,121],"time-consuming":[39],"test-time":[40],"training":[41,135,147],"phases":[42],"makes":[43],"these":[44,68],"fail":[46],"many":[48],"scenarios":[49],"cannot":[51],"be":[52,107],"used":[53,116],"practical":[55],"applications.":[56],"In":[57,123],"this":[58,166],"work,":[59],"we":[60,140],"present":[61],"data-driven":[63,170],"post-processing":[64],"method":[65,81,172,197],"overcome":[67],"achieve":[71],"online":[72],"processing.":[73],"Based":[74],"deep":[77],"recurrent":[78],"network,":[79],"our":[80,164,196],"takes":[82],"adjacent":[84],"original":[85],"optimized":[87],"map":[89],"as":[90],"inputs":[91],"learn":[93],"temporal":[94,176],"consistency":[95,177],"dataset":[98,136,150],"achieves":[100],"higher":[101],"accuracy.":[103],"Our":[104],"approach":[105,143],"can":[106],"applied":[108],"multiple":[110],"single-frame":[111],"models":[114,193],"various":[118],"real-world":[119],"scenes":[120],"real-time.":[122],"addition,":[124],"tackle":[126],"lack":[128],"of":[129,137,163,178],"temporally":[131],"video":[133,148],"dynamic":[138],"scenes,":[139],"propose":[141],"an":[142],"generate":[145],"sequences":[149],"single":[153],"image":[154],"based":[155],"inferring":[157],"motion":[158],"field.":[159],"To":[160],"best":[162],"knowledge,":[165],"is":[167],"first":[169],"plug-and-play":[171],"improve":[174],"videos.":[183],"Extensive":[184],"experiments":[185],"three":[187,190],"datasets":[188],"show":[194],"that":[195],"outperforms":[198],"state-of-the-art":[200],"methods.":[201]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
