{"id":"https://openalex.org/W4403780629","doi":"https://doi.org/10.1145/3664647.3681122","title":"Cross-Class Domain Adaptive Semantic Segmentation with Visual Language Models","display_name":"Cross-Class Domain Adaptive Semantic Segmentation with Visual Language Models","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403780629","doi":"https://doi.org/10.1145/3664647.3681122"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3681122","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681122","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013976393","display_name":"Wenqi Ren","orcid":"https://orcid.org/0000-0001-5501-2867"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenqi Ren","raw_affiliation_strings":["East China University of Science and Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-5501-2867","affiliations":[{"raw_affiliation_string":"East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080327203","display_name":"Ruihao Xia","orcid":"https://orcid.org/0009-0008-6749-5104"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruihao Xia","raw_affiliation_strings":["East China University of Science and Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0008-6749-5104","affiliations":[{"raw_affiliation_string":"East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038942290","display_name":"Meng Zheng","orcid":"https://orcid.org/0000-0002-6677-2017"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meng Zheng","raw_affiliation_strings":["United Imaging Intelligence, Burlington, Massachusetts, USA"],"raw_orcid":"https://orcid.org/0000-0002-6677-2017","affiliations":[{"raw_affiliation_string":"United Imaging Intelligence, Burlington, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003798053","display_name":"Ziyan Wu","orcid":"https://orcid.org/0000-0002-9774-7770"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ziyan Wu","raw_affiliation_strings":["United Imaging Intelligence, Burlington, Massachusetts, USA"],"raw_orcid":"https://orcid.org/0000-0002-9774-7770","affiliations":[{"raw_affiliation_string":"United Imaging Intelligence, Burlington, Massachusetts, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028570509","display_name":"Yang Tang","orcid":"https://orcid.org/0000-0002-2750-8029"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Tang","raw_affiliation_strings":["East China University of Science and Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2750-8029","affiliations":[{"raw_affiliation_string":"East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027171279","display_name":"Nicu Sebe","orcid":"https://orcid.org/0000-0002-6597-7248"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Nicu Sebe","raw_affiliation_strings":["University of Trento, Trento, Italy"],"raw_orcid":"https://orcid.org/0000-0002-6597-7248","affiliations":[{"raw_affiliation_string":"University of Trento, Trento, Italy","institution_ids":["https://openalex.org/I193223587"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5013976393"],"corresponding_institution_ids":["https://openalex.org/I143593769"],"apc_list":null,"apc_paid":null,"fwci":0.4762,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.65100098,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"5005","last_page":"5014"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8001275062561035},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6023725271224976},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.598082959651947},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5920470952987671},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5468579530715942},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.49981236457824707},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08695146441459656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8001275062561035},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6023725271224976},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.598082959651947},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5920470952987671},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5468579530715942},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.49981236457824707},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08695146441459656},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3664647.3681122","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681122","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:iris.unitn.it:11572/439450","is_oa":false,"landing_page_url":"https://hdl.handle.net/11572/439450","pdf_url":null,"source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1984685202","https://openalex.org/W2186222003","https://openalex.org/W2340897893","https://openalex.org/W2559655401","https://openalex.org/W2779610669","https://openalex.org/W2795889831","https://openalex.org/W2798593490","https://openalex.org/W2887964057","https://openalex.org/W2901870313","https://openalex.org/W2948429981","https://openalex.org/W2962687275","https://openalex.org/W2963073217","https://openalex.org/W2981429991","https://openalex.org/W2985406498","https://openalex.org/W2997910357","https://openalex.org/W2998115938","https://openalex.org/W3034723751","https://openalex.org/W3035236545","https://openalex.org/W3035294798","https://openalex.org/W3108560336","https://openalex.org/W3110437118","https://openalex.org/W3120562181","https://openalex.org/W3120804725","https://openalex.org/W3171007011","https://openalex.org/W3180659539","https://openalex.org/W3183166151","https://openalex.org/W3190096330","https://openalex.org/W3204557602","https://openalex.org/W3205021045","https://openalex.org/W3206360173","https://openalex.org/W3213165621","https://openalex.org/W3217147624","https://openalex.org/W4234552385","https://openalex.org/W4295788754","https://openalex.org/W4304091837","https://openalex.org/W4304092597","https://openalex.org/W4312458986","https://openalex.org/W4312768455","https://openalex.org/W4312832581","https://openalex.org/W4366995877","https://openalex.org/W4386047746","https://openalex.org/W4386065590","https://openalex.org/W4386071707","https://openalex.org/W4386075561","https://openalex.org/W4386076397","https://openalex.org/W4390872487","https://openalex.org/W4390874217"],"related_works":["https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W2501551404","https://openalex.org/W4298131179","https://openalex.org/W2113201962","https://openalex.org/W4385583601","https://openalex.org/W4395685956","https://openalex.org/W2799953226","https://openalex.org/W4398146871","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0,33],"paper":[1],"addresses":[2],"the":[3,14,30,38,46,120,133,159,170],"issue":[4],"of":[5,40,49,71,122,135,162,174],"cross-class":[6,53],"domain":[7,16],"adaptation":[8],"(CCDA)":[9],"in":[10,29],"semantic":[11,112],"segmentation,":[12],"where":[13],"target":[15],"contains":[17],"both":[18,50],"shared":[19],"and":[20,52,68,114,172],"novel":[21,43,94,136,163],"classes":[22,44],"that":[23,97],"are":[24,69,154],"either":[25],"unlabeled":[26],"or":[27],"unseen":[28],"source":[31],"domain.":[32],"problem":[34],"is":[35],"challenging,":[36],"as":[37],"absence":[39],"labels":[41,92,124],"for":[42,93],"hampers":[45],"effective":[47],"solutions":[48],"cross-domain":[51],"problems.":[54],"Since":[55],"Visual":[56],"Language":[57],"Models":[58],"(VLMs)":[59],"have":[60],"exhibited":[61],"impressive":[62],"generalization":[63],"across":[64,178],"diverse":[65],"data":[66],"distributions":[67],"capable":[70],"generating":[72],"zero-shot":[73],"predictions":[74],"without":[75],"requiring":[76],"task-specific":[77],"training":[78],"examples,":[79],"we":[80,104,138,168],"propose":[81],"a":[82,106,116],"label":[83],"alignment":[84],"method":[85,108,177],"by":[86],"leveraging":[87],"VLMs":[88,98],"to":[89,109,125,147,157],"relabel":[90],"pseudo":[91,123],"classes.":[95,164],"Considering":[96],"typically":[99],"provide":[100],"only":[101],"image-level":[102],"predictions,":[103,152],"embed":[105],"two-stage":[107],"enable":[110],"fine-grained":[111],"segmentation":[113],"design":[115],"threshold":[117],"based":[118],"on":[119],"uncertainty":[121],"exclude":[126],"noisy":[127],"VLM":[128,151],"predictions.":[129],"To":[130],"further":[131],"augment":[132],"supervision":[134],"classes,":[137],"devise":[139],"memory":[140],"banks":[141],"with":[142],"an":[143],"adaptive":[144],"update":[145],"scheme":[146],"effectively":[148],"manage":[149],"accurate":[150],"which":[153],"then":[155],"resampled":[156],"increase":[158],"sampling":[160],"probability":[161],"Through":[165],"comprehensive":[166],"experiments,":[167],"demonstrate":[169],"effectiveness":[171],"versatility":[173],"our":[175],"proposed":[176],"various":[179],"CCDA":[180],"scenarios.":[181]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
