{"id":"https://openalex.org/W4388185446","doi":"https://doi.org/10.1145/3581783.3612042","title":"Multi-Frame Self-Supervised Depth Estimation with Multi-Scale Feature Fusion in Dynamic Scenes","display_name":"Multi-Frame Self-Supervised Depth Estimation with Multi-Scale Feature Fusion in Dynamic Scenes","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4388185446","doi":"https://doi.org/10.1145/3581783.3612042"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612042","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024302488","display_name":"Jiquan Zhong","orcid":"https://orcid.org/0000-0002-8558-4388"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiquan Zhong","raw_affiliation_strings":["Xiamen University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026169938","display_name":"Xiaolin Huang","orcid":"https://orcid.org/0000-0003-4285-6520"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolin Huang","raw_affiliation_strings":["Shanghai Jiao Tong University &amp; Key Laboratory of System Control and Information Processing, Ministry of Education of China, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University &amp; Key Laboratory of System Control and Information Processing, Ministry of Education of China, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100689641","display_name":"Xiao Yu","orcid":"https://orcid.org/0000-0003-2564-645X"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Yu","raw_affiliation_strings":["Xiamen University &amp; Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University &amp; Key Laboratory of Multimedia Trusted Perception and Efficient Computing, Ministry of Education of China, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5024302488"],"corresponding_institution_ids":["https://openalex.org/I191208505"],"apc_list":null,"apc_paid":null,"fwci":0.6018,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.69987708,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2553","last_page":"2563"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7974109649658203},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7592958211898804},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.641621470451355},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6266776323318481},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6250358819961548},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.574732780456543},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.45018988847732544},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.4113558530807495},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3363193869590759},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.24256694316864014}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7974109649658203},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7592958211898804},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.641621470451355},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6266776323318481},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6250358819961548},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.574732780456543},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.45018988847732544},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.4113558530807495},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3363193869590759},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.24256694316864014},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C103038307","wikidata":"https://www.wikidata.org/wiki/Q6556360","display_name":"Lipid bilayer fusion","level":3,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612042","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G866175898","display_name":null,"funder_award_id":"62173283, 61977046","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1905829557","https://openalex.org/W1992989752","https://openalex.org/W2108134361","https://openalex.org/W2117248802","https://openalex.org/W2133665775","https://openalex.org/W2150066425","https://openalex.org/W2194775991","https://openalex.org/W2300779272","https://openalex.org/W2340897893","https://openalex.org/W2609883120","https://openalex.org/W2935854115","https://openalex.org/W2963316641","https://openalex.org/W2963583471","https://openalex.org/W2964968086","https://openalex.org/W2981732213","https://openalex.org/W2982102242","https://openalex.org/W2985775862","https://openalex.org/W2999905431","https://openalex.org/W3014641072","https://openalex.org/W3034307881","https://openalex.org/W3034428934","https://openalex.org/W3034604951","https://openalex.org/W3035056458","https://openalex.org/W3060975791","https://openalex.org/W3129944514","https://openalex.org/W3130403939","https://openalex.org/W3133929890","https://openalex.org/W3175682855","https://openalex.org/W3176063055","https://openalex.org/W3203073814","https://openalex.org/W3205269569","https://openalex.org/W4297845938","https://openalex.org/W4303449827","https://openalex.org/W4312386157","https://openalex.org/W4312398233","https://openalex.org/W4312572946","https://openalex.org/W4312856322"],"related_works":["https://openalex.org/W200819717","https://openalex.org/W2032269556","https://openalex.org/W2770593030","https://openalex.org/W2944448661","https://openalex.org/W2064421702","https://openalex.org/W1991834176","https://openalex.org/W4253756925","https://openalex.org/W2131956013","https://openalex.org/W4281727072","https://openalex.org/W4391053327"],"abstract_inverted_index":{"Monocular":[0],"depth":[1,23,29,36,56,98,117,142],"estimation":[2,57,118],"is":[3,42,73,111],"a":[4,34,104],"fundamental":[5],"task":[6],"in":[7,122],"computer":[8],"vision":[9],"and":[10,48,89,108],"multimedia.":[11],"The":[12,75,128],"self-supervised":[13],"learning":[14],"pipeline":[15],"makes":[16],"it":[17],"possible":[18],"to":[19],"train":[20],"the":[21,53,85,91,96,115,126,140],"monocular":[22],"network":[24,107],"with":[25,38,60,70,103],"no":[26],"need":[27],"of":[28,55,95],"labels.":[30],"In":[31],"this":[32],"paper,":[33],"multi-frame":[35,97,116,141],"model":[37],"multi-scale":[39],"feature":[40],"fusion":[41],"proposed":[43,133],"for":[44],"strengthening":[45],"texture":[46],"features":[47],"spatial-temporal":[49],"features,":[50],"which":[51,83,113],"improves":[52,114],"robustness":[54],"between":[58],"frames":[59],"large":[61],"camera":[62],"ego-motion.":[63],"A":[64],"novel":[65],"dynamic":[66,77],"object":[67],"detecting":[68],"method":[69],"geometry":[71],"explainability":[72],"proposed.":[74],"detected":[76],"objects":[78],"are":[79],"excluded":[80],"during":[81,125],"training,":[82],"guarantees":[84],"static":[86],"environment":[87],"assumption":[88],"relieves":[90],"accuracy":[92],"degradation":[93],"problem":[94],"estimation.":[99,143],"Robust":[100],"knowledge":[101],"distillation":[102],"consistent":[105],"teacher":[106],"reliability":[109],"guarantee":[110],"proposed,":[112],"without":[119],"an":[120],"increase":[121],"computation":[123],"complexity":[124],"test.":[127],"experiments":[129],"show":[130],"that":[131],"our":[132],"methods":[134],"achieve":[135],"great":[136],"performance":[137],"improvement":[138],"on":[139]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2023-11-02T00:00:00"}
