{"id":"https://openalex.org/W7160235950","doi":"https://doi.org/10.1109/wacv61042.2026.00517","title":"HiMix : Hierarchical Visual-Textual Mixing Network for Lesion Segmentation","display_name":"HiMix : Hierarchical Visual-Textual Mixing Network for Lesion Segmentation","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7160235950","doi":"https://doi.org/10.1109/wacv61042.2026.00517"},"language":null,"primary_location":{"id":"doi:10.1109/wacv61042.2026.00517","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00517","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110186886","display_name":"Soojin Hwang","orcid":null},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Soojin Hwang","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104264406","display_name":"Jaeyoon Sim","orcid":null},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaeyoon Sim","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5135393105","display_name":"Won Hwa Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Won Hwa Kim","raw_affiliation_strings":["Pohang University of Science and Technology (POSTECH)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Pohang University of Science and Technology (POSTECH)","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110186886"],"corresponding_institution_ids":["https://openalex.org/I123900574"],"apc_list":null,"apc_paid":null,"fwci":21.8359,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.99298581,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5332","last_page":"5341"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6003999710083008,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6003999710083008,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.08380000293254852,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.033799998462200165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5159000158309937},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5152999758720398},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3643999993801117},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.35989999771118164},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.31709998846054077}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.659500002861023},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5351999998092651},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5159000158309937},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5152999758720398},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.478300005197525},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3643999993801117},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.35989999771118164},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C138777275","wikidata":"https://www.wikidata.org/wiki/Q6884054","display_name":"Mixing (physics)","level":2,"score":0.31369999051094055},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2630999982357025},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.26159998774528503}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/wacv61042.2026.00517","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00517","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2146296749","https://openalex.org/W2734349601","https://openalex.org/W2884436604","https://openalex.org/W2911489562","https://openalex.org/W2948947170","https://openalex.org/W2963341956","https://openalex.org/W2964303116","https://openalex.org/W2994720379","https://openalex.org/W2995225687","https://openalex.org/W2997286550","https://openalex.org/W3014974815","https://openalex.org/W3034238904","https://openalex.org/W3046375318","https://openalex.org/W3118485687","https://openalex.org/W3197957534","https://openalex.org/W3201906559","https://openalex.org/W3202533032","https://openalex.org/W4200631575","https://openalex.org/W4212875960","https://openalex.org/W4221163766","https://openalex.org/W4295915728","https://openalex.org/W4295937486","https://openalex.org/W4308235625","https://openalex.org/W4312443924","https://openalex.org/W4312533035","https://openalex.org/W4321232185","https://openalex.org/W4382998948","https://openalex.org/W4385573131","https://openalex.org/W4385764483","https://openalex.org/W4387211388","https://openalex.org/W4387211904","https://openalex.org/W4390873528","https://openalex.org/W4391109864","https://openalex.org/W4392449449","https://openalex.org/W4393159347","https://openalex.org/W4394596572","https://openalex.org/W4400881081","https://openalex.org/W4402076595","https://openalex.org/W4403067383","https://openalex.org/W4403088732","https://openalex.org/W4405812102","https://openalex.org/W4406569078","https://openalex.org/W4414243662","https://openalex.org/W4414694048"],"related_works":[],"abstract_inverted_index":{"Lesion":[0],"segmentation":[1,51,110],"is":[2],"an":[3],"essential":[4,91],"task":[5],"in":[6,23,34,48,187],"medical":[7,36,49],"imaging":[8],"to":[9,39,74,87,133,142,179],"support":[10],"diagnosis":[11],"and":[12,72,80,94,116,147,162,171],"assessment":[13],"of":[14,155],"pathologies.":[15],"While":[16],"deep":[17],"learning":[18],"models":[19],"have":[20,52],"shown":[21],"success":[22],"various":[24],"domains,":[25],"their":[26,85],"reliance":[27],"on":[28,158],"large-scale":[29],"annotated":[30],"datasets":[31,164],"limits":[32,84],"applicability":[33,186],"the":[35,120,144,159],"domain":[37],"due":[38],"labeling":[40],"cost.":[41],"To":[42],"address":[43],"this":[44,98],"issue,":[45],"recent":[46],"studies":[47],"image":[50,115,139],"utilized":[53],"clinical":[54,189],"texts":[55],"as":[56],"complementary":[57],"semantic":[58],"cues":[59,90],"without":[60],"additional":[61],"annotations.":[62],"However,":[63],"most":[64],"existing":[65],"methods":[66],"utilize":[67],"a":[68,107],"single":[69],"textual":[70,181],"embedding":[71],"fail":[73],"capture":[75],"hierarchical":[76,127],"interactions":[77],"between":[78],"language":[79],"visual":[81,149],"features,":[82],"which":[83],"ability":[86],"leverage":[88],"fine-grained":[89,134],"for":[92],"precise":[93],"detailed":[95],"segmentation.":[96],"In":[97],"regime,":[99],"we":[100],"propose":[101],"Hierarchical":[102],"Visual-Textual":[103],"Mixing":[104],"Network":[105],"(HiMix),":[106],"novel":[108],"multi-modal":[109,172],"framework":[111],"that":[112,166],"mixes":[113],"multi-scale":[114],"text":[117,128],"representations":[118],"throughout":[119],"mask":[121],"decoding":[122],"process.":[123],"HiMix":[124,167,175],"progressively":[125],"injects":[126],"embedding,":[129],"from":[130],"high-level":[131],"semantics":[132],"spatial":[135],"details,":[136],"into":[137],"corresponding":[138],"decoder":[140],"layers":[141],"bridge":[143],"modality":[145],"gap":[146],"enhance":[148],"feature":[150],"refinement":[151],"at":[152],"multiple":[153],"levels":[154],"abstraction.":[156],"Experiments":[157],"QaTa-COV19,":[160],"MosMed-Data+":[161],"Kvasir-SEG":[163],"demonstrate":[165],"consistently":[168],"outperforms":[169],"uni-modal":[170],"methods.":[173],"Furthermore,":[174],"exhibits":[176],"strong":[177],"generalization":[178],"unstructured":[180],"formats,":[182],"highlighting":[183],"its":[184],"practical":[185],"real-world":[188],"scenarios.":[190]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-26T13:28:51.108037","created_date":"2026-05-06T00:00:00"}
