{"id":"https://openalex.org/W3001179317","doi":"https://doi.org/10.1109/vcip47243.2019.8965952","title":"DVONet: Unsupervised Monocular Depth Estimation and Visual Odometry","display_name":"DVONet: Unsupervised Monocular Depth Estimation and Visual Odometry","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3001179317","doi":"https://doi.org/10.1109/vcip47243.2019.8965952","mag":"3001179317"},"language":"en","primary_location":{"id":"doi:10.1109/vcip47243.2019.8965952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip47243.2019.8965952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100460327","display_name":"Xiangyu Li","orcid":"https://orcid.org/0000-0003-0094-8865"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiangyu Li","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023247075","display_name":"Yonghong Hou","orcid":"https://orcid.org/0000-0002-1676-5505"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yonghong Hou","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075668011","display_name":"Qi Wu","orcid":"https://orcid.org/0000-0002-1196-226X"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Wu","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042680345","display_name":"Pichao Wang","orcid":"https://orcid.org/0000-0002-1430-0237"},"institutions":[{"id":"https://openalex.org/I4210095624","display_name":"Alibaba Group (United States)","ror":"https://ror.org/00rn0m335","country_code":"US","type":"company","lineage":["https://openalex.org/I4210095624","https://openalex.org/I45928872"]},{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pichao Wang","raw_affiliation_strings":["Alibaba Group (U.S.) Inc., Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Alibaba Group (U.S.) Inc., Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210095624","https://openalex.org/I4210108985"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100695040","display_name":"Wanqing Li","orcid":"https://orcid.org/0000-0002-4427-2687"},"institutions":[{"id":"https://openalex.org/I204824540","display_name":"University of Wollongong","ror":"https://ror.org/00jtmb277","country_code":"AU","type":"education","lineage":["https://openalex.org/I204824540"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Wanqing Li","raw_affiliation_strings":["Advanced Multimedia Research Lab, University of Wollongong, Australia"],"affiliations":[{"raw_affiliation_string":"Advanced Multimedia Research Lab, University of Wollongong, Australia","institution_ids":["https://openalex.org/I204824540"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100460327"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":0.5111,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.70743666,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"2019","issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.8689702749252319},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.8459798097610474},{"id":"https://openalex.org/keywords/visual-odometry","display_name":"Visual odometry","score":0.7960377335548401},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7243313193321228},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7209841012954712},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5131979584693909},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.5023586750030518},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.4777609407901764},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4681459069252014},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3440425992012024},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.33979639410972595},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.16252845525741577}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.8689702749252319},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8459798097610474},{"id":"https://openalex.org/C5799516","wikidata":"https://www.wikidata.org/wiki/Q4110915","display_name":"Visual odometry","level":3,"score":0.7960377335548401},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7243313193321228},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7209841012954712},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5131979584693909},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.5023586750030518},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.4777609407901764},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4681459069252014},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3440425992012024},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.33979639410972595},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.16252845525741577},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/vcip47243.2019.8965952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip47243.2019.8965952","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},{"id":"pmh:oai:ro.uow.edu.au:eispapers1-4751","is_oa":false,"landing_page_url":"https://ro.uow.edu.au/eispapers1/3725","pdf_url":null,"source":{"id":"https://openalex.org/S4306400510","display_name":"Research Online (University of Wollongong)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I204824540","host_organization_name":"University of Wollongong","host_organization_lineage":["https://openalex.org/I204824540"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Faculty of Engineering and Information Sciences - Papers: Part B","raw_type":"presentation"},{"id":"mag:3091052310","is_oa":false,"landing_page_url":"https://jglobal.jst.go.jp/en/detail?JGLOBAL_ID=202002292184320916","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W1612997784","https://openalex.org/W2115579991","https://openalex.org/W2125416623","https://openalex.org/W2133665775","https://openalex.org/W2171740948","https://openalex.org/W2300779272","https://openalex.org/W2520707372","https://openalex.org/W2598706937","https://openalex.org/W2609883120","https://openalex.org/W2951234442","https://openalex.org/W2962816904","https://openalex.org/W2963583471","https://openalex.org/W2964314455","https://openalex.org/W3103648783","https://openalex.org/W3106440972","https://openalex.org/W6618372016","https://openalex.org/W6685261749"],"related_works":["https://openalex.org/W4386394365","https://openalex.org/W3006563365","https://openalex.org/W2954249689","https://openalex.org/W2001736731","https://openalex.org/W2626414811","https://openalex.org/W4302306787","https://openalex.org/W2913604885","https://openalex.org/W4313484789","https://openalex.org/W3045795527","https://openalex.org/W4300939778"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"an":[3],"unsupervised":[4,103],"learning":[5],"framework":[6,20],"for":[7,88],"monocular":[8,39],"depth":[9,34,53,90],"estimation":[10,77,91],"and":[11,27,35,50,78,92,105],"visual":[12],"odometry":[13],"(VO),":[14],"referred":[15],"to":[16,30,108],"as":[17],"DVONet.":[18],"The":[19,82],"is":[21,28,58,66,73],"trained":[22],"using":[23],"stereo":[24,46],"image":[25],"sequences":[26],"able":[29],"estimate":[31],"absolute-scale":[32],"scene":[33],"camera":[36],"poses":[37],"from":[38],"images.":[40],"To":[41],"mitigate":[42],"the":[43,52,69,96,101,109],"effect":[44],"of":[45],"occlusions":[47],"in":[48],"training":[49],"improve":[51],"estimation,":[54],"left-right":[55],"occlusion":[56],"mask":[57],"introduced.":[59],"In":[60],"addition,":[61],"a":[62],"novel":[63],"VO":[64,93],"network":[65,72],"proposed":[67,83],"where":[68],"feature":[70],"extraction":[71],"shared":[74],"between":[75],"pose":[76],"optical":[79],"flow":[80],"estimation.":[81],"DVONet":[84],"achieves":[85],"state-of-the-art":[86],"results":[87],"both":[89],"tasks":[94],"on":[95],"KITTI":[97],"driving":[98],"dataset,":[99],"outperforming":[100],"existing":[102],"methods":[104],"being":[106],"comparable":[107],"traditional":[110],"ones.":[111]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
