{"id":"https://openalex.org/W7137888794","doi":"https://doi.org/10.1609/aaai.v40i6.42414","title":"AdaDepth: Exploiting Inherent Scene Information for Self-Supervised Depth Estimation in Dynamic Scenes","display_name":"AdaDepth: Exploiting Inherent Scene Information for Self-Supervised Depth Estimation in Dynamic Scenes","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7137888794","doi":"https://doi.org/10.1609/aaai.v40i6.42414"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i6.42414","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42414","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/42414/46375","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/42414/46375","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125721340","display_name":"Xuanang Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuanang Gao","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129735174","display_name":"Xiongbin Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiongbin Wu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103200149","display_name":"Zhiwei Ning","orcid":"https://orcid.org/0009-0005-2294-6010"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwei Ning","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101004131","display_name":"Runze Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I99043593","display_name":"Macquarie University","ror":"https://ror.org/01sf06y89","country_code":"AU","type":"education","lineage":["https://openalex.org/I99043593"]}],"countries":["AU","CN"],"is_corresponding":false,"raw_author_name":"Runze Yang","raw_affiliation_strings":["Shanghai Jiao Tong University\nMacquarie University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University\nMacquarie University","institution_ids":["https://openalex.org/I99043593","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129658470","display_name":"Zhonglong Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I135237710","display_name":"Zhejiang Normal University","ror":"https://ror.org/01vevwk45","country_code":"CN","type":"education","lineage":["https://openalex.org/I135237710"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhonglong Zheng","raw_affiliation_strings":["Zhejiang Normal University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang Normal University","institution_ids":["https://openalex.org/I135237710"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129683497","display_name":"Jie Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Yang","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129679250","display_name":"Wei Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5125721340"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10944206,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"6","first_page":"4185","last_page":"4193"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.007400000002235174,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.006200000178068876,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.619700014591217},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5489000082015991},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5145999789237976},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.4790000021457672},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4699000120162964},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.45080000162124634},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.4296000003814697},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3928999900817871}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7491000294685364},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.727400004863739},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6938999891281128},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.619700014591217},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5489000082015991},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5145999789237976},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.4790000021457672},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4699000120162964},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.45080000162124634},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.4296000003814697},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3928999900817871},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.37540000677108765},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3522000014781952},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.28949999809265137},{"id":"https://openalex.org/C146159030","wikidata":"https://www.wikidata.org/wiki/Q7625099","display_name":"Structure from motion","level":3,"score":0.2750000059604645},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2612000107765198},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i6.42414","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42414","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/42414/46375","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i6.42414","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i6.42414","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/42414/46375","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.7946767807006836,"display_name":"Sustainable cities and communities"}],"awards":[{"id":"https://openalex.org/G1965710864","display_name":null,"funder_award_id":"24Z990200676","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2624907594","display_name":null,"funder_award_id":"62272419","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5623680443","display_name":null,"funder_award_id":"62376153","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7137888794.pdf","grobid_xml":"https://content.openalex.org/works/W7137888794.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Self-supervised":[0],"monocular":[1],"depth":[2,73,93,119,132,140],"estimation":[3,133],"methods":[4],"severely":[5],"compromise":[6],"accuracy":[7],"in":[8,134,142],"dynamic":[9,20,57,135,144],"objects":[10],"due":[11],"to":[12,41,124],"their":[13],"static":[14],"scene":[15,69,83,99],"assumption.":[16],"Existing":[17],"approaches":[18],"for":[19,56],"scenes":[21,145],"suffer":[22],"from":[23],"two":[24],"critical":[25],"shortcomings:":[26],"1)":[27],"reliance":[28],"on":[29,148,157],"supervised":[30],"segmentation":[31,153],"models":[32,40],"(requiring":[33],"costly":[34],"annotations)":[35],"or":[36,151],"computationally":[37],"intensive":[38],"multi-branch":[39],"isolate":[42],"moving":[43],"objects,":[44],"and":[45,71,95,108,121,127,160],"2)":[46],"simple":[47],"integration":[48],"of":[49,91,106],"2D/3D":[50],"motion":[51,109],"flow":[52],"without":[53,146],"reliable":[54],"supervision":[55],"objects.":[58],"We":[59],"propose":[60],"AdaDepth,":[61],"a":[62,92],"two\u2011stage":[63],"framework":[64],"that":[65],"jointly":[66],"performs":[67],"unsupervised":[68],"decomposition":[70,84],"dynamic-aware":[72],"learning.":[74],"In":[75,111],"the":[76,88,98,104,112,118],"initial":[77],"structural":[78],"stage,":[79,115],"our":[80],"geometry-motion":[81],"joint":[82],"(GMoDecomp)":[85],"module":[86],"ensures":[87],"robust":[89],"generation":[90],"prior":[94,120],"simultaneously":[96],"partitions":[97],"into":[100],"multiple":[101],"regions":[102,123],"through":[103],"fusion":[105],"geometric":[107],"cues.":[110],"region-adaptive":[113],"refinement":[114],"we":[116],"exploit":[117],"decomposed":[122],"introduce":[125],"motion-aware":[126],"geometry-consistent":[128],"constraints,":[129],"effectively":[130],"improving":[131],"scenes.":[136],"AdaDepth":[137],"achieves":[138],"accurate":[139],"prediction":[141],"highly":[143],"relying":[147],"external":[149],"labels":[150],"specialized":[152],"models.":[154],"Extensive":[155],"experiments":[156],"KITTI,":[158],"Cityscapes,":[159],"Waymo":[161],"Open":[162],"demonstrate":[163],"its":[164],"superiority":[165],"over":[166],"state-of-the-art":[167],"approaches.":[168]},"counts_by_year":[],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2026-03-18T00:00:00"}
