{"id":"https://openalex.org/W4416749458","doi":"https://doi.org/10.1109/iros60139.2025.11246835","title":"EndoMUST: Monocular Depth Estimation for Robotic Endoscopy via End-to-end Multi-step Self-supervised Training","display_name":"EndoMUST: Monocular Depth Estimation for Robotic Endoscopy via End-to-end Multi-step Self-supervised Training","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416749458","doi":"https://doi.org/10.1109/iros60139.2025.11246835"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11246835","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11246835","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069326184","display_name":"Liangjing Shao","orcid":"https://orcid.org/0009-0009-9176-579X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liangjing Shao","raw_affiliation_strings":["Fudan University,College of Biomedical Engineering"],"affiliations":[{"raw_affiliation_string":"Fudan University,College of Biomedical Engineering","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100976190","display_name":"Linxin Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linxin Bai","raw_affiliation_strings":["Fudan University,College of Biomedical Engineering"],"affiliations":[{"raw_affiliation_string":"Fudan University,College of Biomedical Engineering","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101932246","display_name":"Cong Du","orcid":"https://orcid.org/0000-0002-8098-987X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenkang Du","raw_affiliation_strings":["Fudan University,College of Biomedical Engineering"],"affiliations":[{"raw_affiliation_string":"Fudan University,College of Biomedical Engineering","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049438049","display_name":"Xinrong Chen","orcid":"https://orcid.org/0009-0009-3706-2102"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinrong Chen","raw_affiliation_strings":["Fudan University,College of Biomedical Engineering"],"affiliations":[{"raw_affiliation_string":"Fudan University,College of Biomedical Engineering","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5069326184"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37002468,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"7739","last_page":"7746"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.8639000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.8639000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.017400000244379044,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.011900000274181366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.7773000001907349},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5325999855995178},{"id":"https://openalex.org/keywords/interference","display_name":"Interference (communication)","score":0.5041000247001648},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.43299999833106995},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.41519999504089355},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3962000012397766},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.38659998774528503},{"id":"https://openalex.org/keywords/depth-perception","display_name":"Depth perception","score":0.352400004863739}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.7773000001907349},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7150999903678894},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7017999887466431},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6887999773025513},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5325999855995178},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.5041000247001648},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.43299999833106995},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.41519999504089355},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3962000012397766},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.38659998774528503},{"id":"https://openalex.org/C52672216","wikidata":"https://www.wikidata.org/wiki/Q1749840","display_name":"Depth perception","level":3,"score":0.352400004863739},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.2987000048160553},{"id":"https://openalex.org/C193581530","wikidata":"https://www.wikidata.org/wiki/Q683778","display_name":"Structured light","level":2,"score":0.29660001397132874},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2793999910354614},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.26669999957084656},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11246835","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11246835","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309612","display_name":"Natural Science Foundation of Shanghai","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2770363598","https://openalex.org/W2962864875","https://openalex.org/W2963596017","https://openalex.org/W2964014680","https://openalex.org/W2985544790","https://openalex.org/W2989184872","https://openalex.org/W2991651424","https://openalex.org/W3044812225","https://openalex.org/W3152803807","https://openalex.org/W3179159099","https://openalex.org/W4200072305","https://openalex.org/W4229439973","https://openalex.org/W4282941808","https://openalex.org/W4321512633","https://openalex.org/W4377115383","https://openalex.org/W4386076206","https://openalex.org/W4390693694","https://openalex.org/W4396909933","https://openalex.org/W4402727359","https://openalex.org/W4403062944","https://openalex.org/W4404415442","https://openalex.org/W4404914305","https://openalex.org/W4406260671","https://openalex.org/W4408286403","https://openalex.org/W4415798746"],"related_works":[],"abstract_inverted_index":{"Monocular":[0],"depth":[1,71,142,149],"estimation":[2,5,72,143,150],"and":[3,12,17,25,38,66,108,147],"ego-motion":[4],"are":[6,57,119],"significant":[7],"tasks":[8],"for":[9,54,69],"scene":[10],"perception":[11],"navigation":[13],"in":[14,28,73,85],"stable,":[15],"accurate":[16],"efficient":[18,81],"robot-assisted":[19],"endoscopy.":[20,74],"To":[21],"tackle":[22],"lighting":[23],"variations":[24],"sparse":[26],"textures":[27],"endoscopic":[29],"scenes,":[30],"multiple":[31,55,109],"techniques":[32],"including":[33,101],"optical":[34,102],"flow,":[35],"appearance":[36],"flow":[37,103],"intrinsic":[39],"image":[40,106],"decomposition":[41,107],"have":[42],"been":[43,167],"introduced":[44],"into":[45,98],"the":[46,50,94,116,131,134],"existing":[47],"methods.":[48],"However,":[49],"effective":[51],"training":[52],"strategy":[53],"modules":[56],"still":[58],"critical":[59],"to":[60],"deal":[61],"with":[62,79,154],"both":[63],"illumination":[64],"issues":[65],"information":[67],"interference":[68,122],"self-supervised":[70,141],"Therefore,":[75],"a":[76],"novel":[77],"framework":[78],"multistep":[80],"finetuning":[82,129],"is":[83,96],"proposed":[84,135],"this":[86,164],"work.":[87],"In":[88],"each":[89,113],"epoch":[90],"of":[91,123,163],"end-to-end":[92],"training,":[93],"process":[95],"divided":[97],"three":[99],"steps,":[100],"registration,":[104],"multiscale":[105],"transformation":[110],"alignments.":[111],"At":[112],"step,":[114],"only":[115],"related":[117],"networks":[118],"trained":[120],"without":[121],"irrelevant":[124],"information.":[125],"Based":[126],"on":[127,130,140,144,151,169],"parameter-efficient":[128],"foundation":[132],"model,":[133],"method":[136],"achieves":[137],"state-of-the-art":[138],"performance":[139],"SCARED":[145],"dataset":[146],"zero-shot":[148],"Hamlyn":[152],"dataset,":[153],"4%":[155],"\u223c":[156],"10%":[157],"lower":[158],"error.":[159],"The":[160],"evaluation":[161],"code":[162],"work":[165],"has":[166],"published":[168],"https://github.com/BaymaxShao/EndoMUST.":[170]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-28T00:00:00"}
