{"id":"https://openalex.org/W4226256580","doi":"https://doi.org/10.1109/tcsvt.2022.3215587","title":"3D Hierarchical Refinement and Augmentation for Unsupervised Learning of Depth and Pose From Monocular Video","display_name":"3D Hierarchical Refinement and Augmentation for Unsupervised Learning of Depth and Pose From Monocular Video","publication_year":2022,"publication_date":"2022-11-03","ids":{"openalex":"https://openalex.org/W4226256580","doi":"https://doi.org/10.1109/tcsvt.2022.3215587"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2022.3215587","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2022.3215587","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100336735","display_name":"Guangming Wang","orcid":"https://orcid.org/0000-0002-7675-543X"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guangming Wang","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiquan Zhong","orcid":"https://orcid.org/0000-0003-1785-7871"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiquan Zhong","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100298354","display_name":"Shijie Zhao","orcid":"https://orcid.org/0000-0002-8466-8061"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shijie Zhao","raw_affiliation_strings":["Department of Engineering Mechanics, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Engineering Mechanics, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053002998","display_name":"Wenhua Wu","orcid":"https://orcid.org/0000-0002-4045-9014"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenhua Wu","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100462338","display_name":"Zhe Liu","orcid":"https://orcid.org/0000-0001-6753-0303"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Liu","raw_affiliation_strings":["MOE Key Laboratory of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MOE Key Laboratory of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107772128","display_name":"Hesheng Wang","orcid":"https://orcid.org/0000-0002-9959-1634"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hesheng Wang","raw_affiliation_strings":["Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education, Shanghai Engineering Research Center of Intelligent Control and Management, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100336735"],"corresponding_institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03160626,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"33","issue":"4","first_page":"1776","last_page":"1786"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.8402508497238159},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7830398678779602},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7813363075256348},{"id":"https://openalex.org/keywords/image-warping","display_name":"Image warping","score":0.726248562335968},{"id":"https://openalex.org/keywords/visual-odometry","display_name":"Visual odometry","score":0.725517988204956},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.7030601501464844},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6834980845451355},{"id":"https://openalex.org/keywords/depth-map","display_name":"Depth map","score":0.5315803289413452},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.518601655960083},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.4629652500152588},{"id":"https://openalex.org/keywords/view-synthesis","display_name":"View synthesis","score":0.45033177733421326},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3976028263568878},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3154228925704956}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8402508497238159},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7830398678779602},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7813363075256348},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.726248562335968},{"id":"https://openalex.org/C5799516","wikidata":"https://www.wikidata.org/wiki/Q4110915","display_name":"Visual odometry","level":3,"score":0.725517988204956},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.7030601501464844},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6834980845451355},{"id":"https://openalex.org/C141268832","wikidata":"https://www.wikidata.org/wiki/Q2940499","display_name":"Depth map","level":3,"score":0.5315803289413452},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.518601655960083},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.4629652500152588},{"id":"https://openalex.org/C2776449333","wikidata":"https://www.wikidata.org/wiki/Q7928781","display_name":"View synthesis","level":3,"score":0.45033177733421326},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3976028263568878},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3154228925704956},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2022.3215587","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2022.3215587","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1031521155","display_name":null,"funder_award_id":"U1913204","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1545384812","display_name":null,"funder_award_id":"62225309","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4785738499","display_name":null,"funder_award_id":"62073222","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5163237521","display_name":null,"funder_award_id":"U21A20480","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7399542710","display_name":null,"funder_award_id":"21511101900","funder_id":"https://openalex.org/F4320321885","funder_display_name":"Science and Technology Commission of Shanghai Municipality"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321885","display_name":"Science and Technology Commission of Shanghai Municipality","ror":"https://ror.org/03kt66j61"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1803059841","https://openalex.org/W1990643921","https://openalex.org/W2002955990","https://openalex.org/W2012875423","https://openalex.org/W2105038642","https://openalex.org/W2115579991","https://openalex.org/W2133665775","https://openalex.org/W2150066425","https://openalex.org/W2300779272","https://openalex.org/W2520707372","https://openalex.org/W2535547924","https://openalex.org/W2582030122","https://openalex.org/W2593414960","https://openalex.org/W2609883120","https://openalex.org/W2784130972","https://openalex.org/W2788857104","https://openalex.org/W2886322387","https://openalex.org/W2890589396","https://openalex.org/W2890860133","https://openalex.org/W2890949887","https://openalex.org/W2950304854","https://openalex.org/W2962804601","https://openalex.org/W2962816904","https://openalex.org/W2963265330","https://openalex.org/W2963549785","https://openalex.org/W2963583471","https://openalex.org/W2963654727","https://openalex.org/W2963906250","https://openalex.org/W2964968086","https://openalex.org/W2966967866","https://openalex.org/W2967321219","https://openalex.org/W2969088625","https://openalex.org/W2982102242","https://openalex.org/W2985775862","https://openalex.org/W3007774126","https://openalex.org/W3014263713","https://openalex.org/W3034364596","https://openalex.org/W3034921716","https://openalex.org/W3035056458","https://openalex.org/W3096743677","https://openalex.org/W3107156787","https://openalex.org/W3108829545","https://openalex.org/W3109585842","https://openalex.org/W3118453581","https://openalex.org/W3128629208","https://openalex.org/W3132270109","https://openalex.org/W3145609993","https://openalex.org/W3153847062","https://openalex.org/W3162552392","https://openalex.org/W3165757908","https://openalex.org/W3167610791","https://openalex.org/W3173805712","https://openalex.org/W3175965986","https://openalex.org/W3176063055","https://openalex.org/W3176210901","https://openalex.org/W3204625264","https://openalex.org/W3212108214","https://openalex.org/W4214628039","https://openalex.org/W4226494925","https://openalex.org/W6631190155","https://openalex.org/W6685261749","https://openalex.org/W6767088534","https://openalex.org/W6785114638","https://openalex.org/W6785345353"],"related_works":["https://openalex.org/W10793771","https://openalex.org/W291087","https://openalex.org/W9584637","https://openalex.org/W16750289","https://openalex.org/W151830","https://openalex.org/W2758677","https://openalex.org/W1000462","https://openalex.org/W1938723","https://openalex.org/W7166613","https://openalex.org/W17583743"],"abstract_inverted_index":{"Depth":[0],"and":[1,9,14,27,48,59,64,81,94,110,185,205],"ego-motion":[2,28],"estimations":[3,61],"are":[4,62],"essential":[5],"for":[6,148],"the":[7,24,30,57,69,85,91,98,106,111,114,119,135,149,161,210],"localization":[8],"navigation":[10],"of":[11,113],"autonomous":[12,15],"robots":[13],"driving.":[16],"Recent":[17],"studies":[18],"make":[19],"it":[20],"possible":[21],"to":[22,67,117,209],"learn":[23],"per-pixel":[25],"depth":[26,58,93,180],"from":[29,105],"unlabeled":[31],"monocular":[32,202],"video.":[33],"In":[34,54],"this":[35,55,132],"paper,":[36,133],"a":[37,128,141,154,168],"novel":[38],"unsupervised":[39,201],"training":[40],"framework":[41,137],"is":[42,79,125,146],"proposed":[43,80,147],"with":[44,90,214],"3D":[45,52,164],"hierarchical":[46],"refinement":[47,124],"augmentation":[49,144],"using":[50],"explicit":[51],"geometry.":[53],"framework,":[56],"pose":[60,71,100,150,162],"hierarchically":[63],"mutually":[65],"coupled":[66],"refine":[68,118],"estimated":[70,92,104],"layer":[72],"by":[73,83,152],"layer.":[74],"The":[75,122,173,217],"intermediate":[76],"view":[77,108,156],"image":[78,89,109,112,143],"synthesized":[82],"warping":[84],"pixels":[86],"in":[87,127,131,163],"an":[88],"coarse":[95,120],"pose.":[96,121],"Then,":[97],"residual":[99],"transformation":[101],"can":[102],"be":[103,221],"new":[107,142,155,169],"adjacent":[115],"frame":[116],"iterative":[123],"implemented":[126],"differentiable":[129],"manner":[130],"making":[134],"whole":[136],"optimized":[138],"uniformly.":[139],"Meanwhile,":[140],"method":[145],"estimation":[151,181],"synthesizing":[153],"image,":[157],"which":[158],"creatively":[159],"augments":[160],"space":[165],"but":[166],"gets":[167],"augmented":[170],"2D":[171],"image.":[172],"experiments":[174],"on":[175],"KITTI":[176],"demonstrate":[177],"that":[178,190],"our":[179],"achieves":[182,206],"state-of-the-art":[183],"performance":[184,208],"even":[186],"surpasses":[187],"recent":[188,200],"approaches":[189],"utilize":[191],"other":[192],"auxiliary":[193],"tasks.":[194],"Our":[195],"visual":[196],"odometry":[197],"outperforms":[198],"all":[199],"learning-based":[203],"methods":[204],"competitive":[207],"geometry-based":[211],"method,":[212],"ORB-SLAM2":[213],"back-end":[215],"optimization.":[216],"source":[218],"codes":[219],"will":[220],"released":[222],"soon":[223],"at:":[224],"<uri":[225],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[226],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/IRMVLab/HRANet</uri>":[227],".":[228]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2022-05-05T00:00:00"}
