{"id":"https://openalex.org/W7133741206","doi":"https://doi.org/10.48550/arxiv.2603.03571","title":"Confidence-aware Monocular Depth Estimation for Minimally Invasive Surgery","display_name":"Confidence-aware Monocular Depth Estimation for Minimally Invasive Surgery","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133741206","doi":"https://doi.org/10.48550/arxiv.2603.03571"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.03571","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128135597","display_name":"Muhammad Asad","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Asad, Muhammad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003589624","display_name":"Emanuele Colleoni","orcid":"https://orcid.org/0000-0003-4614-5742"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Colleoni, Emanuele","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110735713","display_name":"Pritesh Mehta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mehta, Pritesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128180968","display_name":"Nicolas Toussaint","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Toussaint, Nicolas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069643347","display_name":"Ricardo S\u00e1nchez-Matilla","orcid":"https://orcid.org/0000-0003-2330-0973"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanchez-Matilla, Ricardo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004212009","display_name":"Maria Robu","orcid":"https://orcid.org/0000-0003-0106-0542"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robu, Maria","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019352700","display_name":"Faisal Bashir","orcid":"https://orcid.org/0000-0003-2473-2575"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bashir, Faisal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128130110","display_name":"Rahim Mohammadi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohammadi, Rahim","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Luengo, Imanol","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luengo, Imanol","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128140460","display_name":"Danail Stoyanov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stoyanov, Danail","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5128135597"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9506999850273132,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9506999850273132,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.008200000040233135,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.007199999876320362,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6467999815940857},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5442000031471252},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5289000272750854},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4742000102996826},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.4415000081062317},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4316999912261963},{"id":"https://openalex.org/keywords/confidence-interval","display_name":"Confidence interval","score":0.38909998536109924},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.383899986743927}],"concepts":[{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6467999815940857},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.621999979019165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5982999801635742},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5442000031471252},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5289000272750854},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47620001435279846},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4742000102996826},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.4415000081062317},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4316999912261963},{"id":"https://openalex.org/C44249647","wikidata":"https://www.wikidata.org/wiki/Q208498","display_name":"Confidence interval","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.3357999920845032},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.32919999957084656},{"id":"https://openalex.org/C122048520","wikidata":"https://www.wikidata.org/wiki/Q2913954","display_name":"Percentile","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C202799725","wikidata":"https://www.wikidata.org/wiki/Q272035","display_name":"Accuracy and precision","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.2847999930381775},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25679999589920044}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.03571","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.03571","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.03571","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.03571","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Purpose:":[0],"Monocular":[1],"depth":[2,43,134,150,170],"estimation":[3,117,151,171],"(MDE)":[4],"is":[5,79,119],"vital":[6],"for":[7,51,221],"scene":[8],"understanding":[9],"in":[10,191,200],"minimally":[11],"invasive":[12],"surgery":[13],"(MIS).":[14],"However,":[15],"endoscopic":[16,164],"video":[17],"sequences":[18],"are":[19,95],"often":[20],"contaminated":[21],"by":[22,173,196],"smoke,":[23],"specular":[24],"reflections,":[25],"blur,":[26],"and":[27,111,142,153,198,202,205],"occlusions,":[28],"limiting":[29],"the":[30,157,161,178],"accuracy":[31,152,172,187],"of":[32,74,133,188],"MDE":[33,38,62,93,189,207],"models.":[34],"In":[35],"addition,":[36],"current":[37],"models":[39,78,94,190,208],"do":[40],"not":[41],"output":[42],"confidence,":[44],"which":[45],"could":[46],"be":[47,215],"a":[48,59,115],"valuable":[49],"tool":[50],"improving":[52],"their":[53,219],"clinical":[54,163,203,222],"reliability.":[55,135],"Methods:":[56],"We":[57],"propose":[58],"novel":[60],"confidence-aware":[61,98,183],"framework":[63,148,184],"featuring":[64],"three":[65],"significant":[66],"contributions:":[67],"(i)":[68],"Calibrated":[69],"confidence":[70,87,103,116,128,211],"targets:":[71],"an":[72],"ensemble":[73],"fine-tuned":[75],"stereo":[76],"matching":[77],"used":[80,216],"to":[81,125,177,209,217],"capture":[82],"disparity":[83],"variance":[84],"into":[85],"pixel-wise":[86,102],"probabilities;":[88],"(ii)":[89],"Confidence-aware":[90],"loss:":[91],"Baseline":[92],"optimized":[96],"with":[97,121],"loss":[99],"functions,":[100],"utilizing":[101],"probabilities":[104],"such":[105],"that":[106,146,213],"reliable":[107],"pixels":[108],"dominate":[109],"training;":[110],"(iii)":[112],"Inference-time":[113],"confidence:":[114],"head":[118],"proposed":[120],"two":[122],"convolution":[123],"layers":[124],"predict":[126],"per-pixel":[127],"at":[129],"inference,":[130],"enabling":[131],"assessment":[132],"Results:":[136],"Comprehensive":[137],"experimental":[138],"validation":[139],"across":[140],"internal":[141,162],"public":[143],"datasets":[144],"demonstrates":[145],"our":[147],"improves":[149],"can":[154],"robustly":[155],"quantify":[156],"prediction's":[158],"confidence.":[159],"On":[160],"dataset":[165],"(StereoKP),":[166],"we":[167],"improve":[168,218],"dense":[169],"~8%":[174],"as":[175],"compared":[176],"baseline":[179],"model.":[180],"Conclusion:":[181],"Our":[182],"enables":[185],"improved":[186],"MIS,":[192],"addressing":[193],"challenges":[194],"posed":[195],"noise":[197],"artifacts":[199],"pre-clinical":[201],"data,":[204],"allows":[206],"provide":[210],"maps":[212],"may":[214],"reliability":[220],"applications.":[223]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-06T00:00:00"}
