{"id":"https://openalex.org/W7117326688","doi":"https://doi.org/10.48550/arxiv.2512.21135","title":"TGC-Net: A Structure-Aware and Semantically-Aligned Framework for Text-Guided Medical Image Segmentation","display_name":"TGC-Net: A Structure-Aware and Semantically-Aligned Framework for Text-Guided Medical Image Segmentation","publication_year":2025,"publication_date":"2025-12-24","ids":{"openalex":"https://openalex.org/W7117326688","doi":"https://doi.org/10.48550/arxiv.2512.21135"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.21135","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21135","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.21135","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121348609","display_name":"Gaoren Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lin, Gaoren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121313115","display_name":"Huangxuan Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Huangxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121357278","display_name":"Yuan Xiong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Yuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121363411","display_name":"Lefei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lefei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121341727","display_name":"Bo Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Bo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5040762746","display_name":"Wentao Zhu","orcid":"https://orcid.org/0000-0002-5483-0259"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Wentao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5121348609"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.40380001068115234,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.40380001068115234,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.25450000166893005,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.12099999934434891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6891999840736389},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6541000008583069},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6496999859809875},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.5852000117301941},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5205000042915344},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.46149998903274536},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4300999939441681}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7386999726295471},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7005000114440918},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6891999840736389},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6541000008583069},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6496999859809875},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.5852000117301941},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5205000042915344},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5034999847412109},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.46149998903274536},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4300999939441681},{"id":"https://openalex.org/C22029948","wikidata":"https://www.wikidata.org/wiki/Q45089","display_name":"Dice","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.38019999861717224},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3790000081062317},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.37389999628067017},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.32030001282691956},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.2815999984741211},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26330000162124634}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.21135","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21135","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.21135","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.21135","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Text-guided":[0],"medical":[1,44,111],"segmentation":[2,4],"enhances":[3],"accuracy":[5],"by":[6,48],"utilizing":[7],"clinical":[8,62],"reports":[9],"as":[10],"auxiliary":[11],"information.":[12],"However,":[13],"existing":[14],"methods":[15],"typically":[16],"rely":[17],"on":[18,79,129,154],"unaligned":[19],"image":[20],"and":[21,64,113,135],"text":[22],"encoders,":[23],"which":[24],"necessitate":[25],"complex":[26,61],"interaction":[27],"modules":[28],"for":[29,99],"multimodal":[30,37],"fusion.":[31],"While":[32],"CLIP":[33],"provides":[34],"a":[35,75,86,96,103,114,124],"pre-aligned":[36],"feature":[38,126],"space,":[39],"its":[40],"direct":[41],"application":[42],"to":[43],"imaging":[45],"is":[46],"limited":[47],"three":[49],"main":[50],"issues:":[51],"insufficient":[52],"preservation":[53],"of":[54,60],"fine-grained":[55],"anatomical":[56],"structures,":[57],"inadequate":[58],"modeling":[59],"descriptions,":[63],"domain-specific":[65],"semantic":[66],"misalignment.":[67],"To":[68],"tackle":[69],"these":[70],"challenges,":[71],"we":[72],"propose":[73],"TGC-Net,":[74],"CLIP-based":[76],"framework":[77],"focusing":[78],"parameter-efficient,":[80],"task-specific":[81],"adaptations.":[82],"Specifically,":[83],"it":[84],"incorporates":[85],"Semantic-Structural":[87],"Synergy":[88],"Encoder":[89,106],"(SSE)":[90],"that":[91,108,119,140],"augments":[92],"CLIP's":[93],"ViT":[94],"with":[95,145],"CNN":[97],"branch":[98],"multi-scale":[100],"structural":[101],"refinement,":[102],"Domain-Augmented":[104],"Text":[105],"(DATE)":[107],"injects":[109],"large-language-model-derived":[110],"knowledge,":[112],"Vision-Language":[115],"Calibration":[116],"Module":[117],"(VLCM)":[118],"refines":[120],"cross-modal":[121],"correspondence":[122],"in":[123],"unified":[125],"space.":[127],"Experiments":[128],"five":[130],"datasets":[131],"across":[132],"chest":[133],"X-ray":[134],"thoracic":[136],"CT":[137],"modalities":[138],"demonstrate":[139],"TGC-Net":[141],"achieves":[142],"state-of-the-art":[143],"performance":[144],"substantially":[146],"fewer":[147],"trainable":[148],"parameters,":[149],"including":[150],"notable":[151],"Dice":[152],"gains":[153],"challenging":[155],"benchmarks.":[156]},"counts_by_year":[],"updated_date":"2025-12-26T23:12:39.385286","created_date":"2025-12-26T00:00:00"}
