{"id":"https://openalex.org/W4404914305","doi":"https://doi.org/10.1109/tcsvt.2024.3509619","title":"MonoDiffusion: Self-Supervised Monocular Depth Estimation Using Diffusion Model","display_name":"MonoDiffusion: Self-Supervised Monocular Depth Estimation Using Diffusion Model","publication_year":2024,"publication_date":"2024-12-02","ids":{"openalex":"https://openalex.org/W4404914305","doi":"https://doi.org/10.1109/tcsvt.2024.3509619"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3509619","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3509619","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000411800","display_name":"Shuwei Shao","orcid":"https://orcid.org/0000-0001-8057-1599"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuwei Shao","raw_affiliation_strings":["School of Automation Science and Electrical Engineering, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8057-1599","affiliations":[{"raw_affiliation_string":"School of Automation Science and Electrical Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076604839","display_name":"Zhongcai Pei","orcid":"https://orcid.org/0000-0001-7748-8591"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhongcai Pei","raw_affiliation_strings":["School of Automation Science and Electrical Engineering, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7748-8591","affiliations":[{"raw_affiliation_string":"School of Automation Science and Electrical Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026365889","display_name":"Weihai Chen","orcid":"https://orcid.org/0000-0001-7912-4505"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weihai Chen","raw_affiliation_strings":["School of Automation Science and Electrical Engineering, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7912-4505","affiliations":[{"raw_affiliation_string":"School of Automation Science and Electrical Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070136304","display_name":"Dingchi Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dingchi Sun","raw_affiliation_strings":["School of Automation Science and Electrical Engineering, Beihang University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Automation Science and Electrical Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017988774","display_name":"Peter C. Y. Chen","orcid":"https://orcid.org/0000-0003-4851-9875"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Peter C. Y. Chen","raw_affiliation_strings":["Department of Mechanical Engineering, National University of Singapore, Cluny Road, Singapore","Department of Mechanical Engineering, National University of Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-4851-9875","affiliations":[{"raw_affiliation_string":"Department of Mechanical Engineering, National University of Singapore, Cluny Road, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Department of Mechanical Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100700917","display_name":"Zhengguo Li","orcid":"https://orcid.org/0000-0002-4525-1204"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhengguo Li","raw_affiliation_strings":["VI Department, Institute for Infocomm Research, A*STAR, Fusionopolis, Singapore","VI department, Institute for Infocomm Research, A*STAR, 1 Fusionopolis Way, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4525-1204","affiliations":[{"raw_affiliation_string":"VI Department, Institute for Infocomm Research, A*STAR, Fusionopolis, Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"VI department, Institute for Infocomm Research, A*STAR, 1 Fusionopolis Way, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.5548,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.95945205,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"35","issue":"4","first_page":"3664","last_page":"3678"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9453999996185303,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9453999996185303,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6936912536621094},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6166560649871826},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5921373963356018},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5459247827529907},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.491699755191803},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.41066765785217285},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40237540006637573}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6936912536621094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6166560649871826},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5921373963356018},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5459247827529907},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.491699755191803},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.41066765785217285},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40237540006637573},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3509619","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3509619","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4137382365","display_name":null,"funder_award_id":"2024C03042","funder_id":"https://openalex.org/F8142712028","funder_display_name":"Key Research and Development Program of Zhejiang Province"},{"id":"https://openalex.org/G558676831","display_name":null,"funder_award_id":"61620106012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6300563505","display_name":null,"funder_award_id":"2021C03050","funder_id":"https://openalex.org/F8142712028","funder_display_name":"Key Research and Development Program of Zhejiang Province"},{"id":"https://openalex.org/G6686779602","display_name":null,"funder_award_id":"62333023","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G938713618","display_name":null,"funder_award_id":"M23L7b0021","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F8142712028","display_name":"Key Research and Development Program of Zhejiang Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":96,"referenced_works":["https://openalex.org/W2099940712","https://openalex.org/W2108598243","https://openalex.org/W2132947399","https://openalex.org/W2133665775","https://openalex.org/W2150066425","https://openalex.org/W2194775991","https://openalex.org/W2520707372","https://openalex.org/W2609883120","https://openalex.org/W2803168974","https://openalex.org/W2890949887","https://openalex.org/W2948647700","https://openalex.org/W2962741876","https://openalex.org/W2962960377","https://openalex.org/W2963265330","https://openalex.org/W2963316641","https://openalex.org/W2963488291","https://openalex.org/W2963583471","https://openalex.org/W2963591054","https://openalex.org/W2963654727","https://openalex.org/W2964968086","https://openalex.org/W2985775862","https://openalex.org/W2990946490","https://openalex.org/W3034428934","https://openalex.org/W3034604951","https://openalex.org/W3035056458","https://openalex.org/W3035434014","https://openalex.org/W3035574324","https://openalex.org/W3107156787","https://openalex.org/W3118453581","https://openalex.org/W3152863269","https://openalex.org/W3155072588","https://openalex.org/W3162552392","https://openalex.org/W3173274332","https://openalex.org/W3173727695","https://openalex.org/W3174581459","https://openalex.org/W3194533273","https://openalex.org/W3194822352","https://openalex.org/W3203943632","https://openalex.org/W3204559841","https://openalex.org/W3212516020","https://openalex.org/W4206545998","https://openalex.org/W4281677543","https://openalex.org/W4283392354","https://openalex.org/W4292829030","https://openalex.org/W4312819733","https://openalex.org/W4312933868","https://openalex.org/W4313156423","https://openalex.org/W4321512633","https://openalex.org/W4322616103","https://openalex.org/W4376481259","https://openalex.org/W4382450646","https://openalex.org/W4382467380","https://openalex.org/W4386075593","https://openalex.org/W4386076206","https://openalex.org/W4386076215","https://openalex.org/W4386280799","https://openalex.org/W4390871795","https://openalex.org/W4390872010","https://openalex.org/W4390872147","https://openalex.org/W4390872705","https://openalex.org/W4390873435","https://openalex.org/W4402753888","https://openalex.org/W4402961751","https://openalex.org/W6618372016","https://openalex.org/W6679045638","https://openalex.org/W6685261749","https://openalex.org/W6726497184","https://openalex.org/W6746200908","https://openalex.org/W6757555829","https://openalex.org/W6757817989","https://openalex.org/W6765775151","https://openalex.org/W6767088534","https://openalex.org/W6771531989","https://openalex.org/W6779823529","https://openalex.org/W6783713337","https://openalex.org/W6786375611","https://openalex.org/W6795288823","https://openalex.org/W6797359156","https://openalex.org/W6804703708","https://openalex.org/W6804811285","https://openalex.org/W6805335523","https://openalex.org/W6805547681","https://openalex.org/W6809885388","https://openalex.org/W6810940779","https://openalex.org/W6811234694","https://openalex.org/W6838639034","https://openalex.org/W6844133118","https://openalex.org/W6844223692","https://openalex.org/W6846598164","https://openalex.org/W6846611385","https://openalex.org/W6850292659","https://openalex.org/W6850311292","https://openalex.org/W6850556344","https://openalex.org/W6853818442","https://openalex.org/W6863243049","https://openalex.org/W6872947455"],"related_works":["https://openalex.org/W200819717","https://openalex.org/W2032269556","https://openalex.org/W1991834176","https://openalex.org/W2944448661","https://openalex.org/W2064421702","https://openalex.org/W4253756925","https://openalex.org/W2805523177","https://openalex.org/W2131956013","https://openalex.org/W2036566443","https://openalex.org/W2081241816"],"abstract_inverted_index":{"Over":[0],"the":[1,59,78,123,133,137,142,157,180],"past":[2],"few":[3],"years,":[4],"self-supervised":[5,52,66,170],"monocular":[6,53],"depth":[7,54,60,118,143],"estimation":[8],"has":[9,136],"received":[10],"widespread":[11],"attention.":[12],"Most":[13],"efforts":[14],"focus":[15],"on":[16,156],"designing":[17],"different":[18],"types":[19],"of":[20,83,126,139],"network":[21],"architectures":[22],"and":[23,33,43,160],"loss":[24],"functions":[25],"or":[26,106],"handling":[27],"edge":[28],"cases,":[29],"for":[30,51,80,99],"example,":[31],"occlusion":[32],"dynamic":[34],"objects.":[35],"In":[36],"this":[37],"work,":[38],"we":[39,68,90,111],"take":[40],"another":[41],"path":[42],"propose":[44],"a":[45,65,70,86,94,113],"novel":[46],"conditional":[47],"diffusion-based":[48],"generative":[49],"framework":[50],"estimation,":[55],"dubbed":[56],"MonoDiffusion.":[57],"Because":[58],"ground-truth":[61,73],"is":[62,129,146],"unavailable":[63],"in":[64,93,151],"setting,":[67],"develop":[69,112],"new":[71],"pseudo":[72],"diffusion":[74,79,92],"process":[75],"to":[76,121,148],"assist":[77],"training.":[81],"Instead":[82],"diffusing":[84],"at":[85],"fixed":[87],"high":[88],"resolution,":[89],"perform":[91],"coarse-to-fine":[95],"manner":[96],"that":[97,132,145,164],"allows":[98],"faster":[100],"inference":[101],"time":[102],"without":[103],"sacrificing":[104],"accuracy":[105],"even":[107],"better":[108],"accuracy.":[109],"Furthermore,":[110],"simple":[114],"yet":[115],"effective":[116],"contrastive":[117],"reconstruction":[119],"mechanism":[120],"enhance":[122],"denoising":[124],"ability":[125],"model.":[127],"It":[128],"worth":[130],"noting":[131],"proposed":[134],"MonoDiffusion":[135,166],"property":[138],"naturally":[140],"acquiring":[141],"uncertainty":[144],"essential":[147],"be":[149,176],"implemented":[150],"safety-critical":[152],"cases.":[153],"Extensive":[154],"experiments":[155],"KITTI,":[158],"Make3D":[159],"DIML":[161],"datasets":[162],"indicate":[163],"our":[165],"outperforms":[167],"prior":[168],"state-of-the-art":[169],"competitors.":[171],"The":[172],"source":[173],"code":[174],"will":[175],"publicly":[177],"available":[178],"upon":[179],"acceptance.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-16T09:24:06.705377","created_date":"2025-10-10T00:00:00"}
