{"id":"https://openalex.org/W4406412134","doi":"https://doi.org/10.1007/s11263-024-02320-3","title":"Unsupervised Semantic Segmentation of Urban Scenes via Cross-Modal Distillation","display_name":"Unsupervised Semantic Segmentation of Urban Scenes via Cross-Modal Distillation","publication_year":2025,"publication_date":"2025-01-15","ids":{"openalex":"https://openalex.org/W4406412134","doi":"https://doi.org/10.1007/s11263-024-02320-3"},"language":"en","primary_location":{"id":"doi:10.1007/s11263-024-02320-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-024-02320-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-024-02320-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11263-024-02320-3.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017371568","display_name":"Anton\u00edn Vobeck\u00fd","orcid":"https://orcid.org/0000-0001-8946-2057"},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]},{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ","FR"],"is_corresponding":true,"raw_author_name":"Antonin Vobecky","raw_affiliation_strings":["Czech Institute of Informatics, Robotics and Cybernetics, Czech Technical University in Prague, Prague, Czech Republic","Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, France","valeo.ai, Paris, France"],"affiliations":[{"raw_affiliation_string":"Czech Institute of Informatics, Robotics and Cybernetics, Czech Technical University in Prague, Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]},{"raw_affiliation_string":"Faculty of Electrical Engineering, Czech Technical University in Prague, Prague, France","institution_ids":["https://openalex.org/I44504214"]},{"raw_affiliation_string":"valeo.ai, Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086144380","display_name":"David Hurych","orcid":"https://orcid.org/0000-0002-0580-4038"},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"David Hurych","raw_affiliation_strings":["valeo.ai, Paris, France"],"affiliations":[{"raw_affiliation_string":"valeo.ai, Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082234499","display_name":"Oriane Sim\u00e9oni","orcid":"https://orcid.org/0000-0003-3232-8978"},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Oriane Sim\u00e9oni","raw_affiliation_strings":["valeo.ai, Paris, France"],"affiliations":[{"raw_affiliation_string":"valeo.ai, Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070809773","display_name":"Spyros Gidaris","orcid":"https://orcid.org/0000-0003-1515-3635"},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Spyros Gidaris","raw_affiliation_strings":["valeo.ai, Paris, France"],"affiliations":[{"raw_affiliation_string":"valeo.ai, Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003783466","display_name":"Andrei Bursuc","orcid":"https://orcid.org/0000-0003-2485-9402"},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Andrei Bursuc","raw_affiliation_strings":["valeo.ai, Paris, France"],"affiliations":[{"raw_affiliation_string":"valeo.ai, Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076170578","display_name":"Patrick P\u00e9rez","orcid":"https://orcid.org/0000-0002-8124-1206"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patrick P\u00e9rez","raw_affiliation_strings":["Kyutai, Paris, France"],"affiliations":[{"raw_affiliation_string":"Kyutai, Paris, France","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025398783","display_name":"Josef \u0160ivic","orcid":"https://orcid.org/0000-0002-2554-5301"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Josef Sivic","raw_affiliation_strings":["Czech Institute of Informatics, Robotics and Cybernetics, Czech Technical University in Prague, Prague, Czech Republic"],"affiliations":[{"raw_affiliation_string":"Czech Institute of Informatics, Robotics and Cybernetics, Czech Technical University in Prague, Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5017371568"],"corresponding_institution_ids":["https://openalex.org/I220619192","https://openalex.org/I44504214"],"apc_list":{"value":2890,"currency":"EUR","value_usd":3690},"apc_paid":{"value":2890,"currency":"EUR","value_usd":3690},"fwci":5.6305,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.94881231,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"133","issue":"6","first_page":"3519","last_page":"3541"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13282","display_name":"Automated Road and Building Extraction","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11164","display_name":"Remote Sensing and LiDAR Applications","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7366219162940979},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7181494832038879},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7020589113235474},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.632145345211029},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6181874871253967},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.433852881193161},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06585466861724854}],"concepts":[{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7366219162940979},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7181494832038879},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7020589113235474},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.632145345211029},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6181874871253967},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.433852881193161},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06585466861724854},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11263-024-02320-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-024-02320-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-024-02320-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11263-024-02320-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-024-02320-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-024-02320-3.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1322491984","display_name":null,"funder_award_id":"CZ.02.1.010.00.015 0030000468","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G1507807434","display_name":null,"funder_award_id":"GS21184OHK33T37","funder_id":"https://openalex.org/F4320309972","funder_display_name":"\u010cesk\u00e9 Vysok\u00e9 U\u010den\u00ed Technick\u00e9 v Praze"},{"id":"https://openalex.org/G6862666737","display_name":null,"funder_award_id":"90140","funder_id":"https://openalex.org/F4320321005","funder_display_name":"Ministerstvo \u0160kolstv\u00ed, Ml\u00e1de\u017ee a T\u011blov\u00fdchovy"}],"funders":[{"id":"https://openalex.org/F4320309972","display_name":"\u010cesk\u00e9 Vysok\u00e9 U\u010den\u00ed Technick\u00e9 v Praze","ror":"https://ror.org/03kqpb082"},{"id":"https://openalex.org/F4320321005","display_name":"Ministerstvo \u0160kolstv\u00ed, Ml\u00e1de\u017ee a T\u011blov\u00fdchovy","ror":"https://ror.org/037n8p820"},{"id":"https://openalex.org/F4320335322","display_name":"European Regional Development Fund","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406412134.pdf","grobid_xml":"https://content.openalex.org/works/W4406412134.grobid-xml"},"referenced_works_count":69,"referenced_works":["https://openalex.org/W764651262","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W1999478155","https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2222512263","https://openalex.org/W2340897893","https://openalex.org/W2560023338","https://openalex.org/W2565639579","https://openalex.org/W2592691248","https://openalex.org/W2595724883","https://openalex.org/W2612690371","https://openalex.org/W2614543743","https://openalex.org/W2619697695","https://openalex.org/W2781228439","https://openalex.org/W2801780873","https://openalex.org/W2883725317","https://openalex.org/W2901870313","https://openalex.org/W2947847748","https://openalex.org/W2952735550","https://openalex.org/W2962865004","https://openalex.org/W2962960500","https://openalex.org/W2964185501","https://openalex.org/W2964309882","https://openalex.org/W2968443604","https://openalex.org/W2982106100","https://openalex.org/W2990138404","https://openalex.org/W2990408345","https://openalex.org/W2990500698","https://openalex.org/W3014641072","https://openalex.org/W3034355852","https://openalex.org/W3035060554","https://openalex.org/W3035172746","https://openalex.org/W3035524453","https://openalex.org/W3035564946","https://openalex.org/W3035574168","https://openalex.org/W3035635319","https://openalex.org/W3035750252","https://openalex.org/W3037309139","https://openalex.org/W3105770007","https://openalex.org/W3107725261","https://openalex.org/W3109301572","https://openalex.org/W3111740481","https://openalex.org/W3114677757","https://openalex.org/W3129110783","https://openalex.org/W3153167542","https://openalex.org/W3159481202","https://openalex.org/W3170088426","https://openalex.org/W3170841864","https://openalex.org/W3171581326","https://openalex.org/W3172456032","https://openalex.org/W3172615411","https://openalex.org/W3175492513","https://openalex.org/W3182978476","https://openalex.org/W3198721070","https://openalex.org/W3207649350","https://openalex.org/W4214504406","https://openalex.org/W4214507759","https://openalex.org/W4214893857","https://openalex.org/W4313123540","https://openalex.org/W4366208220","https://openalex.org/W4386076264","https://openalex.org/W4388032340","https://openalex.org/W4390874346","https://openalex.org/W6638523607","https://openalex.org/W6763612067","https://openalex.org/W6797589674","https://openalex.org/W6856857450"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Abstract":[0],"Semantic":[1],"image":[2,82,141,156],"segmentation":[3,24,41,76],"models":[4],"typically":[5],"require":[6],"extensive":[7],"pixel-wise":[8,39],"annotations,":[9],"which":[10],"are":[11,61],"costly":[12],"to":[13,17,104,149],"obtain":[14],"and":[15,49,81,125,181,208,231,247,258],"prone":[16],"biases.":[18],"Our":[19,59],"work":[20],"investigates":[21],"learning":[22,38,73],"semantic":[23,40,75,155],"in":[25],"urban":[26],"scenes":[27],"without":[28,210],"any":[29,211],"manual":[30,57],"annotation.":[31],"We":[32,188,213],"propose":[33],"a":[34,67,135,151,173],"novel":[35,68],"method":[36,89,195],"for":[37,56,70,107,154],"using":[42,172,226],"raw,":[43],"uncurated":[44],"data":[45,142],"from":[46,185],"vehicle-mounted":[47],"cameras":[48],"LiDAR":[50,80,101],"sensors,":[51],"thus":[52],"eliminating":[53],"the":[54,91,100,146,169,186,190,220,243],"need":[55],"labeling.":[58],"contributions":[60],"as":[62,252,254],"follows.":[63],"First,":[64],"we":[65,112,133,159],"develop":[66],"approach":[69,166],"cross-modal":[71,136],"unsupervised":[72],"of":[74,87,93,164,193,219,242,245],"by":[77,167,196],"leveraging":[78],"synchronized":[79],"data.":[83],"A":[84],"crucial":[85],"element":[86],"our":[88,165,194],"is":[90],"integration":[92],"an":[94,177,215],"object":[95,117],"proposal":[96],"module":[97],"that":[98,114,139],"examines":[99],"point":[102],"cloud":[103],"generate":[105],"proposals":[106,118],"spatially":[108],"consistent":[109],"objects.":[110],"Second,":[111],"demonstrate":[113,160],"these":[115],"3D":[116],"can":[119],"be":[120],"aligned":[121],"with":[122,145,176],"corresponding":[123],"images":[124],"effectively":[126],"grouped":[127],"into":[128],"semantically":[129],"meaningful":[130],"pseudo-classes.":[131],"Third,":[132],"introduce":[134],"distillation":[137,175],"technique":[138],"utilizes":[140],"partially":[143],"annotated":[144],"learnt":[147],"pseudo-classes":[148],"train":[150],"transformer-based":[152],"model":[153,171,222],"segmentation.":[157],"Fourth,":[158],"further":[161],"significant":[162],"improvements":[163],"extending":[168],"proposed":[170,221],"teacher-student":[174],"exponential":[178],"moving":[179],"average":[180],"incorporating":[182],"soft":[183],"targets":[184],"teacher.":[187],"show":[189],"generalization":[191],"capabilities":[192],"testing":[197,201],"on":[198],"four":[199],"different":[200],"datasets":[202],"(Cityscapes,":[203],"Dark":[204],"Zurich,":[205],"Nighttime":[206],"Driving,":[207],"ACDC)":[209],"fine-tuning.":[212],"present":[214],"in-depth":[216],"experimental":[217],"analysis":[218],"including":[223],"results":[224,257],"when":[225],"another":[227],"pre-training":[228],"dataset,":[229],"per-class":[230],"pixel":[232],"accuracy":[233],"results,":[234],"confusion":[235],"matrices,":[236],"PCA":[237],"visualization,":[238],"k-NN":[239],"evaluation,":[240],"ablations":[241],"number":[244],"clusters":[246],"LiDAR\u2019s":[248],"density,":[249],"supervised":[250],"finetuning":[251],"well":[253],"additional":[255],"qualitative":[256],"their":[259],"analysis.":[260]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
