{"id":"https://openalex.org/W7131379636","doi":"https://doi.org/10.48550/arxiv.2602.20423","title":"MedCLIPSeg: Probabilistic Vision-Language Adaptation for Data-Efficient and Generalizable Medical Image Segmentation","display_name":"MedCLIPSeg: Probabilistic Vision-Language Adaptation for Data-Efficient and Generalizable Medical Image Segmentation","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131379636","doi":"https://doi.org/10.48550/arxiv.2602.20423"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.20423","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094302690","display_name":"Taha Koleilat","orcid":"https://orcid.org/0009-0005-9655-0588"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koleilat, Taha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092171892","display_name":"Hojat Asgariandehkordi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Asgariandehkordi, Hojat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045952897","display_name":"Omid Nejati Manzari","orcid":"https://orcid.org/0000-0001-5133-3831"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manzari, Omid Nejati","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004598895","display_name":"Berardino Barile","orcid":"https://orcid.org/0000-0002-4016-9172"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barile, Berardino","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126795202","display_name":"Yiming Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Yiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077743201","display_name":"Hassan Rivaz","orcid":"https://orcid.org/0000-0001-5800-3034"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rivaz, Hassan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.42399999499320984,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.42399999499320984,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.18860000371932983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.18119999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7283999919891357},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6891000270843506},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5806000232696533},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5774999856948853},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5393999814987183},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.5069000124931335},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5056999921798706},{"id":"https://openalex.org/keywords/medical-diagnosis","display_name":"Medical diagnosis","score":0.4672999978065491}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7494999766349792},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7283999919891357},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6991000175476074},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6891000270843506},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5806000232696533},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5774999856948853},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5393999814987183},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.5069000124931335},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5056999921798706},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.4672999978065491},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4575999975204468},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.4417000114917755},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.4032000005245209},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.40059998631477356},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39070001244544983},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3691999912261963},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.36809998750686646},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3515999913215637},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.31839999556541443},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2583000063896179}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.20423","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.20423","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.20423","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.20423","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.5235657095909119,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Medical":[0],"image":[1,33,52,68,150],"segmentation":[2,34,136],"remains":[3,35],"challenging":[4],"due":[5],"to":[6],"limited":[7],"annotations":[8],"for":[9,29,46,147],"training,":[10],"ambiguous":[11],"anatomical":[12],"features,":[13],"and":[14,49,69,72,100,112,124],"domain":[15,101],"shifts.":[16],"While":[17],"vision-language":[18,145],"models":[19],"such":[20],"as":[21],"CLIP":[22,45,58],"offer":[23],"strong":[24],"cross-modal":[25,62],"representations,":[26],"their":[27],"potential":[28,142],"dense,":[30],"text-guided":[31],"medical":[32,51,149],"underexplored.":[36],"We":[37],"present":[38],"MedCLIPSeg,":[39],"a":[40,80],"novel":[41],"framework":[42],"that":[43,85,116,131],"adapts":[44],"robust,":[47],"data-efficient,":[48],"uncertainty-aware":[50],"segmentation.":[53,151],"Our":[54],"approach":[55],"leverages":[56],"patch-level":[57,82],"embeddings":[59],"through":[60],"probabilistic":[61,144],"attention,":[63],"enabling":[64],"bidirectional":[65],"interaction":[66],"between":[67],"text":[70],"tokens":[71],"explicit":[73],"modeling":[74,146],"of":[75,135,143],"predictive":[76],"uncertainty.":[77],"Together":[78],"with":[79],"soft":[81],"contrastive":[83],"loss":[84],"encourages":[86],"more":[87],"nuanced":[88],"semantic":[89],"learning":[90],"across":[91,105],"diverse":[92],"textual":[93],"prompts,":[94],"MedCLIPSeg":[95,117],"effectively":[96],"improves":[97],"data":[98],"efficiency":[99],"generalizability.":[102],"Extensive":[103],"experiments":[104],"16":[106],"datasets":[107],"spanning":[108],"five":[109],"imaging":[110],"modalities":[111],"six":[113],"organs":[114],"demonstrate":[115],"outperforms":[118],"prior":[119],"methods":[120],"in":[121],"accuracy,":[122],"efficiency,":[123],"robustness,":[125],"while":[126],"providing":[127],"interpretable":[128],"uncertainty":[129],"maps":[130],"highlight":[132],"local":[133],"reliability":[134],"results.":[137],"This":[138],"work":[139],"demonstrates":[140],"the":[141],"text-driven":[148]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-02-26T00:00:00"}
