{"id":"https://openalex.org/W4416749893","doi":"https://doi.org/10.1109/iros60139.2025.11247528","title":"EvidMTL: Evidential Multi-Task Learning for Uncertainty-Aware Semantic Surface Mapping from Monocular RGB Images","display_name":"EvidMTL: Evidential Multi-Task Learning for Uncertainty-Aware Semantic Surface Mapping from Monocular RGB Images","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416749893","doi":"https://doi.org/10.1109/iros60139.2025.11247528"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11247528","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247528","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103089658","display_name":"Rohit Menon","orcid":"https://orcid.org/0000-0001-9724-1182"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Rohit Menon","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065181173","display_name":"Nils Dengler","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Nils Dengler","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079893673","display_name":"Sicong Pan","orcid":"https://orcid.org/0000-0003-1994-4266"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sicong Pan","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094135039","display_name":"Gokul Krishna Chenchani","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gokul Krishna Chenchani","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103231515","display_name":"Maren Bennewitz","orcid":"https://orcid.org/0000-0003-4343-3028"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Maren Bennewitz","raw_affiliation_strings":["University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany"],"affiliations":[{"raw_affiliation_string":"University of Bonn,Humanoid Robots Lab and the Center for Robotics,Germany","institution_ids":["https://openalex.org/I135140700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103089658"],"corresponding_institution_ids":["https://openalex.org/I135140700"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.48882976,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"17223","last_page":"17230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.5896999835968018,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.5896999835968018,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.2425999939441681,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.029200000688433647,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6154000163078308},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.5792999863624573},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5573999881744385},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5449000000953674},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5216000080108643},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.4948999881744385},{"id":"https://openalex.org/keywords/evidential-reasoning-approach","display_name":"Evidential reasoning approach","score":0.4250999987125397},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.3840000033378601}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7445999979972839},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.699999988079071},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6154000163078308},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.5792999863624573},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5573999881744385},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5449000000953674},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5216000080108643},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.4948999881744385},{"id":"https://openalex.org/C156201811","wikidata":"https://www.wikidata.org/wiki/Q5418360","display_name":"Evidential reasoning approach","level":4,"score":0.4250999987125397},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4002000093460083},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.3840000033378601},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.350600004196167},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3424000144004822},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.33180001378059387},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3269999921321869},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.31360000371932983},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.28790000081062317},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.28690001368522644},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.272599995136261},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.2567000091075897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11247528","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247528","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W125693051","https://openalex.org/W1901129140","https://openalex.org/W1923697677","https://openalex.org/W1987648924","https://openalex.org/W2012993976","https://openalex.org/W2133844819","https://openalex.org/W2285091887","https://openalex.org/W2520707372","https://openalex.org/W2607968634","https://openalex.org/W2919379406","https://openalex.org/W2963357556","https://openalex.org/W2963677766","https://openalex.org/W2973181288","https://openalex.org/W3090386798","https://openalex.org/W3118635606","https://openalex.org/W3118885154","https://openalex.org/W3173727695","https://openalex.org/W4247250903","https://openalex.org/W4251598436","https://openalex.org/W4312349930","https://openalex.org/W4386065386","https://openalex.org/W4389666105","https://openalex.org/W4389666779","https://openalex.org/W4390873354","https://openalex.org/W4401416751","https://openalex.org/W4405785381","https://openalex.org/W4405787109","https://openalex.org/W4414050933"],"related_works":[],"abstract_inverted_index":{"For":[0],"scene":[1],"understanding":[2],"in":[3,94,166],"unstructured":[4],"environments,":[5],"an":[6,106],"accurate":[7],"and":[8,31,33,60,116,126,132,152,171,179],"uncertainty-aware":[9,64,107,177],"metric-semantic":[10,122],"mapping":[11,23,110,157,169,178],"is":[12],"required":[13],"to":[14,38,144],"enable":[15,71],"informed":[16],"action":[17],"selection":[18],"by":[19,164],"autonomous":[20],"systems.":[21],"Existing":[22],"methods":[24],"often":[25],"suffer":[26],"from":[27,66],"overconfident":[28],"semantic":[29,61,108,153,167],"predictions,":[30],"sparse":[32],"noisy":[34],"depth":[35,58,81,92,115,150],"sensing,":[36],"leading":[37],"inconsistent":[39],"map":[40],"representations.":[41],"In":[42,155],"this":[43],"paper,":[44],"we":[45,76,103],"therefore":[46],"introduce":[47],"EvidMTL,":[48],"a":[49,78],"multitask":[50],"learning":[51],"framework":[52],"that":[53,84],"uses":[54,113],"evidential":[55,73,80,97,114],"heads":[56],"for":[57,119,183],"estimation":[59,142,151],"segmentation,":[62],"enabling":[63],"inference":[65],"monocular":[67],"RGB":[68],"images.":[69],"To":[70],"uncertainty-calibrated":[72],"multi-task":[74],"learning,":[75],"propose":[77],"novel":[79],"loss":[82],"function":[83],"jointly":[85],"optimizes":[86],"the":[87,91,130,174],"belief":[88],"strength":[89],"of":[90,176],"prediction":[93,118],"conjunction":[95],"with":[96],"segmentation":[98],"loss.":[99],"Building":[100],"on":[101,129,137,159],"this,":[102],"present":[104],"EvidKimera,":[105],"surface":[109,168],"framework,":[111],"which":[112],"semantics":[117],"improved":[120],"3D":[121],"consistency.":[123],"We":[124],"train":[125],"evaluate":[127],"EvidMTL":[128],"NYUDepthV2":[131],"assess":[133],"its":[134,181],"zero-shot":[135,156],"performance":[136],"ScanNetV2,":[138,160],"demonstrating":[139],"superior":[140],"uncertainty":[141],"compared":[143],"conventional":[145],"approaches":[146],"while":[147],"maintaining":[148],"comparable":[149],"segmentation.":[154],"tests":[158],"EvidKimera":[161],"outperforms":[162],"Kimera":[163],"30%":[165],"accuracy":[170],"consistency,":[172],"highlighting":[173],"benefits":[175],"underscoring":[180],"potential":[182],"real-world":[184],"robotic":[185],"applications.":[186]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
