{"id":"https://openalex.org/W4399425709","doi":"https://doi.org/10.1109/tase.2024.3409392","title":"Absolute Monocular Depth Estimation on Robotic Visual and Kinematics Data via Self-Supervised Learning","display_name":"Absolute Monocular Depth Estimation on Robotic Visual and Kinematics Data via Self-Supervised Learning","publication_year":2024,"publication_date":"2024-06-07","ids":{"openalex":"https://openalex.org/W4399425709","doi":"https://doi.org/10.1109/tase.2024.3409392"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2024.3409392","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3409392","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085059175","display_name":"Ruofeng Wei","orcid":"https://orcid.org/0000-0002-7071-4135"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Ruofeng Wei","raw_affiliation_strings":["Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100365257","display_name":"Bin Li","orcid":"https://orcid.org/0000-0003-1684-8869"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Li","raw_affiliation_strings":["Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010124359","display_name":"Fangxun Zhong","orcid":"https://orcid.org/0000-0002-1151-1995"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangxun Zhong","raw_affiliation_strings":["Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033077344","display_name":"Hangjie Mo","orcid":"https://orcid.org/0000-0001-8628-3838"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Hangjie Mo","raw_affiliation_strings":["Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090516040","display_name":"Qi Dou","orcid":"https://orcid.org/0000-0002-3416-9950"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Dou","raw_affiliation_strings":["Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100707660","display_name":"Yunhui Liu","orcid":"https://orcid.org/0000-0002-3625-6679"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun-Hui Liu","raw_affiliation_strings":["Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Automation Engineering, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100382905","display_name":"Dong Sun","orcid":"https://orcid.org/0000-0003-3945-4037"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Dong Sun","raw_affiliation_strings":["Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, City University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5085059175"],"corresponding_institution_ids":["https://openalex.org/I168719708"],"apc_list":null,"apc_paid":null,"fwci":3.5754,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.94000903,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"22","issue":null,"first_page":"4269","last_page":"4282"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.700031578540802},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6908418536186218},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6649462580680847},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.6549742221832275},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5817238688468933},{"id":"https://openalex.org/keywords/monocular-vision","display_name":"Monocular vision","score":0.5235409736633301},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.4366745948791504},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.08074286580085754}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.700031578540802},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6908418536186218},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6649462580680847},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.6549742221832275},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5817238688468933},{"id":"https://openalex.org/C158829959","wikidata":"https://www.wikidata.org/wiki/Q1640606","display_name":"Monocular vision","level":2,"score":0.5235409736633301},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.4366745948791504},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.08074286580085754},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2024.3409392","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2024.3409392","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2051917483","display_name":null,"funder_award_id":"11211421","funder_id":"https://openalex.org/F4320334971","funder_display_name":"Science and Engineering Research Council"},{"id":"https://openalex.org/G4565189637","display_name":null,"funder_award_id":"T42-409/18-R","funder_id":"https://openalex.org/F4320334971","funder_display_name":"Science and Engineering Research Council"},{"id":"https://openalex.org/G818396220","display_name":null,"funder_award_id":"62322318","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334971","display_name":"Science and Engineering Research Council","ror":"https://ror.org/00zgdb249"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1821462560","https://openalex.org/W2125188192","https://openalex.org/W2133665775","https://openalex.org/W2194775991","https://openalex.org/W2471962767","https://openalex.org/W2527142681","https://openalex.org/W2543539599","https://openalex.org/W2563705555","https://openalex.org/W2609883120","https://openalex.org/W2801997348","https://openalex.org/W2955639361","https://openalex.org/W2958981985","https://openalex.org/W2963073614","https://openalex.org/W2972124618","https://openalex.org/W2985775862","https://openalex.org/W2989184872","https://openalex.org/W3012355143","https://openalex.org/W3081167590","https://openalex.org/W3096678291","https://openalex.org/W3112952488","https://openalex.org/W3152803807","https://openalex.org/W3179159099","https://openalex.org/W3194607169","https://openalex.org/W3207523613","https://openalex.org/W3214071647","https://openalex.org/W4200072305","https://openalex.org/W4210453703","https://openalex.org/W4210582445","https://openalex.org/W4214520160","https://openalex.org/W4229439973","https://openalex.org/W4235876038","https://openalex.org/W4288751198","https://openalex.org/W4296197038","https://openalex.org/W4298129340","https://openalex.org/W4312995760","https://openalex.org/W4383109137","https://openalex.org/W6743188669","https://openalex.org/W6787724516"],"related_works":["https://openalex.org/W3213413335","https://openalex.org/W3213997683","https://openalex.org/W2736638679","https://openalex.org/W4307623796","https://openalex.org/W2995270189","https://openalex.org/W4313046826","https://openalex.org/W4394784820","https://openalex.org/W1968716783","https://openalex.org/W2084124712","https://openalex.org/W2435467664"],"abstract_inverted_index":{"Accurate":[0,260],"estimation":[1,103,186,245,311,341],"of":[2,167,221,241,266,275,290,312,335],"absolute":[3,61,134,227,242,309,339,346],"depth":[4,34,62,90,102,131,135,185,228,244,261,289,310,340,347],"from":[5,122,255],"a":[6,10,47,75,88,109,302],"monocular":[7,28,64,230,243,268,295,313,343],"endoscope":[8],"is":[9,96,106,170,270],"fundamental":[11],"task":[12],"for":[13,63,137,191,272,338],"automatic":[14,247,279,356],"navigation":[15,249,357],"systems":[16],"in":[17,81,108,246,278,359],"robotic":[18,189],"surgery.":[19],"Previous":[20],"works":[21],"solely":[22],"rely":[23],"on":[24,93,195,342],"uni-modal":[25],"data":[26,187,200,254,320],"(i.e.,":[27],"images),":[29],"which":[30,51],"can":[31,284,350],"only":[32,285],"estimate":[33,58],"values":[35],"arbitrarily":[36],"scaled":[37],"with":[38,150,211,229,263],"the":[39,59,70,82,85,100,120,127,143,148,165,173,203,219,226,239,252,256,267,273,287,291,330,355,360],"real":[40,264],"world.":[41],"In":[42,84,142,175,297],"this":[43,298],"paper,":[44],"we":[45,73,113,146,177,300],"present":[46],"novel":[48],"framework,":[49],"SADER,":[50],"explores":[52],"vision":[53,94],"and":[54,129,198,332],"robot":[55,123],"kinematics":[56],"to":[57,98,117,162,181,224,233,237,306],"high-quality":[60,308],"surgical":[65,184,248,276,292],"scenes.":[66],"To":[67,157],"jointly":[68],"learn":[69],"multi-modal":[71,253],"data,":[72,132],"introduce":[74],"self-distillation":[76],"based":[77,92],"two-stage":[78],"training":[79],"policy":[80],"framework.":[83],"first":[86],"stage,":[87,145],"boosting":[89],"module":[91],"transformer":[95],"proposed":[97],"improve":[99],"relative":[101,130,288],"network":[104,149],"that":[105,202],"trained":[107],"self-supervised":[110,303],"method.":[111],"Then,":[112],"develop":[114],"an":[115,212],"algorithm":[116],"automatically":[118],"compute":[119],"scale":[121,128],"kinematics.":[124],"By":[125],"coupling":[126],"pseudo":[133,155],"labels":[136],"all":[138],"images":[139],"are":[140],"yielded.":[141],"second":[144],"re-train":[147],"3D":[151],"loss":[152],"supervised":[153],"by":[154,250],"labels.":[156],"make":[158],"our":[159,222,336],"method":[160,305],"generalize":[161],"different":[163],"endoscopes,":[164],"learning":[166],"endoscopic":[168,258,314],"intrinsics":[169],"integrated":[171],"into":[172,354],"network.":[174],"addition,":[176],"did":[178],"cadaver":[179,199],"experiments":[180,327],"collect":[182],"new":[183],"about":[188],"laparoscopy":[190],"evaluation.":[192],"Experimental":[193],"results":[194],"public":[196],"SCARED":[197],"demonstrate":[201],"SADER":[204],"outperforms":[205],"previous":[206],"state-of-art":[207],"even":[208],"stereo-based":[209],"methods":[210,283],"accuracy":[213],"error":[214],"under":[215],"1.90":[216],"mm,":[217],"proving":[218],"feasibility":[220,331],"approach":[223],"recover":[225],"inputs.":[231],"Note":[232],"Practitioners\u2014This":[234],"paper":[235],"aims":[236],"solve":[238],"problem":[240],"leveraging":[251],"robot-based":[257],"system.":[259],"perception":[262,348],"scales":[265],"scene":[269,293],"essential":[271],"control":[274],"robots":[277],"navigation.":[280],"However,":[281],"current":[282],"predict":[286],"using":[294],"images.":[296,315],"article,":[299],"propose":[301],"learning-based":[304],"achieve":[307],"It":[316],"neither":[317],"needs":[318],"manual":[319],"annotation,":[321],"nor":[322],"other":[323],"imaging":[324],"modalities.":[325],"The":[326],"extensively":[328],"validate":[329],"high":[333],"performance":[334],"framework":[337,349],"endoscopes.":[344],"This":[345],"be":[351],"potentially":[352],"encapsulated":[353],"system":[358],"near":[361],"future.":[362]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
