{"id":"https://openalex.org/W7162486749","doi":"https://doi.org/10.1109/3dv69130.2026.00178","title":"DINO in the Room: Leveraging 2D Foundation Models for 3D Segmentation","display_name":"DINO in the Room: Leveraging 2D Foundation Models for 3D Segmentation","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7162486749","doi":"https://doi.org/10.1109/3dv69130.2026.00178"},"language":null,"primary_location":{"id":"doi:10.1109/3dv69130.2026.00178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137163339","display_name":"Karim Knaebel","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Karim Knaebel","raw_affiliation_strings":["RWTH Aachen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RWTH Aachen University","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045844841","display_name":"Kadir Y\u0131lmaz","orcid":"https://orcid.org/0000-0002-0819-3420"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Kadir Yilmaz","raw_affiliation_strings":["RWTH Aachen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RWTH Aachen University","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061463972","display_name":"Daan de Geus","orcid":"https://orcid.org/0000-0003-0559-5341"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Daan De Geus","raw_affiliation_strings":["RWTH Aachen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RWTH Aachen University","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071563379","display_name":"Alexander Hermans","orcid":"https://orcid.org/0000-0003-2127-0782"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Alexander Hermans","raw_affiliation_strings":["RWTH Aachen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RWTH Aachen University","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137093747","display_name":"David Adrian","orcid":null},"institutions":[{"id":"https://openalex.org/I4210151956","display_name":"Robert Bosch (India)","ror":"https://ror.org/04my8ty22","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210151956","https://openalex.org/I889804353"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"David Adrian","raw_affiliation_strings":["Bosch Center for AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bosch Center for AI","institution_ids":["https://openalex.org/I4210151956"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084203306","display_name":"Timm Linder","orcid":"https://orcid.org/0000-0001-8532-0262"},"institutions":[{"id":"https://openalex.org/I4210151956","display_name":"Robert Bosch (India)","ror":"https://ror.org/04my8ty22","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210151956","https://openalex.org/I889804353"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Timm Linder","raw_affiliation_strings":["Bosch Center for AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bosch Center for AI","institution_ids":["https://openalex.org/I4210151956"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071006649","display_name":"Bastian Leibe","orcid":"https://orcid.org/0000-0003-4225-0051"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bastian Leibe","raw_affiliation_strings":["RWTH Aachen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"RWTH Aachen University","institution_ids":["https://openalex.org/I887968799"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.83659993,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1884","last_page":"1894"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.38850000500679016,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.38850000500679016,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.09139999747276306,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.05990000069141388,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.4528000056743622},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.44290000200271606},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.301800012588501},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.2969000041484833},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.27469998598098755}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6355999708175659},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.4528000056743622},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.44290000200271606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4187000095844269},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.27469998598098755},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2587999999523163}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/3dv69130.2026.00178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1836465849","https://openalex.org/W2108598243","https://openalex.org/W2407386500","https://openalex.org/W2460657278","https://openalex.org/W2560609797","https://openalex.org/W2594519801","https://openalex.org/W2963125977","https://openalex.org/W2963182550","https://openalex.org/W2990613095","https://openalex.org/W2991216808","https://openalex.org/W3010797203","https://openalex.org/W3035172746","https://openalex.org/W3035574168","https://openalex.org/W3109154950","https://openalex.org/W3109728105","https://openalex.org/W3110503160","https://openalex.org/W3159481202","https://openalex.org/W3166573884","https://openalex.org/W3172717135","https://openalex.org/W3173732446","https://openalex.org/W3177330511","https://openalex.org/W4214755140","https://openalex.org/W4307104049","https://openalex.org/W4312414163","https://openalex.org/W4312649925","https://openalex.org/W4312933868","https://openalex.org/W4313128851","https://openalex.org/W4313145913","https://openalex.org/W4372283849","https://openalex.org/W4386065407","https://openalex.org/W4386065742","https://openalex.org/W4386071758","https://openalex.org/W4386075694","https://openalex.org/W4386075910","https://openalex.org/W4389000546","https://openalex.org/W4390873101","https://openalex.org/W4390873312","https://openalex.org/W4390874108","https://openalex.org/W4390874575","https://openalex.org/W4399146248","https://openalex.org/W4400721967","https://openalex.org/W4401413704","https://openalex.org/W4402667891","https://openalex.org/W4402727277","https://openalex.org/W4402727700","https://openalex.org/W4402727896","https://openalex.org/W4402728013","https://openalex.org/W4402753920","https://openalex.org/W4402916738","https://openalex.org/W4403049399","https://openalex.org/W4403889366","https://openalex.org/W4403905949","https://openalex.org/W4404690790","https://openalex.org/W4407900973","https://openalex.org/W4413144796","https://openalex.org/W4413146709","https://openalex.org/W4413147663","https://openalex.org/W7133207924"],"related_works":[],"abstract_inverted_index":{"Vision":[0],"foundation":[1,94,148],"models":[2,72,144],"(VFMs)":[3],"trained":[4],"on":[5,62,116],"large-scale":[6],"image":[7],"datasets":[8],"provide":[9],"high-quality":[10],"features":[11],"that":[12,88],"have":[13],"significantly":[14],"advanced":[15],"<tex":[16,37,90],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[17,38,91],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$2":[18,39,92],"D$</tex>":[19,40,93],"visual":[20],"recognition.":[21],"However,":[22],"their":[23],"potential":[24],"in":[25],"3D":[26,43,58,63,71,107,121,143,153,168],"scene":[27],"segmentation":[28,110,123,169],"remains":[29],"largely":[30],"untapped,":[31],"despite":[32],"the":[33,66,127,152],"common":[34],"availability":[35],"of":[36,68,129],"images":[41,133],"alongside":[42],"point":[44,108],"cloud":[45,109],"datasets.":[46,176],"While":[47],"significant":[48],"research":[49],"has":[50],"been":[51],"dedicated":[52],"to":[53,99,141],"2D-3D":[54],"fusion,":[55],"recent":[56],"state-of-the-art":[57,114],"methods":[59],"predominantly":[60],"focus":[61],"data,":[64],"leaving":[65],"integration":[67],"VFMs":[69,130],"into":[70,105],"underexplored.":[73],"In":[74],"this":[75,79],"work,":[76],"we":[77,138,161],"challenge":[78],"trend":[80],"by":[81,145],"introducing":[82],"DITR,":[83],"a":[84,106,163],"generally":[85],"applicable":[86],"approach":[87],"extracts":[89],"model":[95],"features,":[96],"projects":[97],"them":[98,104],"3D,":[100],"and":[101,119],"finally":[102],"injects":[103],"model.":[111],"DITR":[112],"achieves":[113],"results":[115],"both":[117],"indoor":[118],"outdoor":[120],"semantic":[122],"benchmarks.":[124],"To":[125],"enable":[126],"use":[128],"even":[131],"when":[132],"are":[134],"unavailable":[135],"during":[136],"inference,":[137],"additionally":[139],"propose":[140],"pretrain":[142],"distilling":[146],"2D":[147,159],"models.":[149],"By":[150],"initializing":[151],"backbone":[154],"with":[155],"knowledge":[156],"distilled":[157],"from":[158],"VFMs,":[160],"create":[162],"strong":[164],"basis":[165],"for":[166],"downstream":[167],"tasks,":[170],"ultimately":[171],"boosting":[172],"performance":[173],"across":[174],"various":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
