{"id":"https://openalex.org/W4402352818","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650648","title":"An Efficient Spatial Modeling Conv-ViT using Mask Supervision for 3D Medical Image Segmentation","display_name":"An Efficient Spatial Modeling Conv-ViT using Mask Supervision for 3D Medical Image Segmentation","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402352818","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650648"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10650648","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650648","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082588749","display_name":"Jiaxing Tian","orcid":"https://orcid.org/0000-0002-1473-8474"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaxing Tian","raw_affiliation_strings":["Dalian University of Technology,School of Computer Science and Technology,Dalian,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Computer Science and Technology,Dalian,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019395532","display_name":"Bingcai Chen","orcid":"https://orcid.org/0000-0001-7158-6537"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingcai Chen","raw_affiliation_strings":["Dalian University of Technology,School of Computer Science and Technology,Dalian,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Computer Science and Technology,Dalian,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113004816","display_name":"Qianyu Li","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianyu Li","raw_affiliation_strings":["Dalian University of Technology,School of Computer Science and Technology,Dalian,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Computer Science and Technology,Dalian,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032188646","display_name":"Ruolan Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruolan Liu","raw_affiliation_strings":["Dalian University of Technology,School of Computer Science and Technology,Dalian,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Computer Science and Technology,Dalian,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024633414","display_name":"Yuanchao Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I1334729051","display_name":"Xinjiang Normal University","ror":"https://ror.org/00ndrvk93","country_code":"CN","type":"education","lineage":["https://openalex.org/I1334729051"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanchao Feng","raw_affiliation_strings":["Xinjiang Normal University,College of Computer Science and Technology,Urumqi,China"],"affiliations":[{"raw_affiliation_string":"Xinjiang Normal University,College of Computer Science and Technology,Urumqi,China","institution_ids":["https://openalex.org/I1334729051"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5082588749"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14631048,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7252850532531738},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.6639658212661743},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6203914284706116},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5957468152046204},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.47598424553871155},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.47034600377082825},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3232682943344116}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7252850532531738},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.6639658212661743},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6203914284706116},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5957468152046204},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.47598424553871155},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.47034600377082825},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3232682943344116}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10650648","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650648","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2752782242","https://openalex.org/W2963163009","https://openalex.org/W2982101047","https://openalex.org/W3034421924","https://openalex.org/W3094502228","https://openalex.org/W3127751679","https://openalex.org/W3138516171","https://openalex.org/W3195135988","https://openalex.org/W3198020043","https://openalex.org/W3203841574","https://openalex.org/W3204255739","https://openalex.org/W4212875960","https://openalex.org/W4225368580","https://openalex.org/W4283072464","https://openalex.org/W4296412923","https://openalex.org/W4298110661","https://openalex.org/W4302009076","https://openalex.org/W4302363625","https://openalex.org/W4312225519","https://openalex.org/W4312428231","https://openalex.org/W4312443924","https://openalex.org/W4321232185","https://openalex.org/W4384159609","https://openalex.org/W4387211248","https://openalex.org/W4390189979","https://openalex.org/W6767312599","https://openalex.org/W6784333009","https://openalex.org/W6790275670","https://openalex.org/W6839656003","https://openalex.org/W6843259600","https://openalex.org/W6845563047","https://openalex.org/W6847258573"],"related_works":["https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W2501551404","https://openalex.org/W4385583601","https://openalex.org/W4298131179","https://openalex.org/W2113201962","https://openalex.org/W4395685956","https://openalex.org/W2799953226","https://openalex.org/W4398146871","https://openalex.org/W1522196789"],"abstract_inverted_index":{"Transformer-CNN":[0],"hybrid":[1],"models":[2,5,17,178],"and":[3,27,40,82,166,191],"ConvNeXt-based":[4],"have":[6,18],"demonstrated":[7],"notable":[8],"success":[9],"in":[10,36,111,142],"3D":[11,72,100],"medical":[12,73,112],"image":[13],"segmentation.":[14],"However,":[15],"these":[16],"redundancy":[19],"problems":[20],"with":[21,67,183],"a":[22,62],"large":[23],"number":[24],"of":[25,30,80,88,99,107,109,127,193],"parameters":[26],"fall":[28],"short":[29],"capturing":[31],"semantic":[32,122,136,153],"information":[33,70],"effectively,":[34],"resulting":[35],"high":[37,188],"modeling":[38,53,86,189],"costs":[39],"limitations":[41],"on":[42,158,179],"segmentation":[43,163],"performance.":[44],"Motivated":[45],"by":[46],"this,":[47],"we":[48,119],"propose":[49],"an":[50,131],"efficient":[51,132],"spatial":[52],"Convolutional":[54],"Vision":[55],"Transformer":[56,90],"using":[57],"Mask":[58,116],"Supervision.":[59],"We":[60,94,155],"design":[61],"convolutional":[63],"encoding":[64],"block":[65],"embedded":[66],"global":[68,85],"context":[69],"for":[71,140],"images":[74],"so":[75],"that":[76,172],"the":[77,83,89,97,105,115,121,128,146,187],"inductive":[78],"bias":[79],"CNN":[81],"powerful":[84],"capability":[87],"are":[91],"effectively":[92],"integrated.":[93],"also":[95],"adopt":[96],"structure":[98],"Dynamic":[101],"Convolution":[102],"to":[103,149],"alleviate":[104],"problem":[106],"anisotropy":[108],"features":[110],"images.":[113],"In":[114],"Supervision":[117],"strategy,":[118],"acquire":[120],"mask":[123,137],"after":[124],"each":[125],"stage":[126],"encoder":[129],"through":[130],"attention":[133],"mechanism.":[134],"The":[135,168],"is":[138],"employed":[139],"supervision":[141],"model":[143,174],"training,":[144],"enhancing":[145],"model\u2019s":[147],"capacity":[148],"assimilate":[150],"more":[151],"intricate":[152],"information.":[154],"conducted":[156],"experiments":[157],"two":[159],"authoritative":[160],"abdominal":[161],"multi-organ":[162],"datasets,":[164],"AMOS2022":[165],"WORD.":[167],"experimental":[169],"results":[170],"show":[171],"our":[173,194],"outperforms":[175],"all":[176],"competitive":[177],"both":[180],"datasets(AMOS2022:90.00,":[181],"WORD:86.28)":[182],"fewer":[184],"parameters(32.53M),":[185],"demonstrating":[186],"efficiency":[190],"effectiveness":[192],"methods.":[195]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
