{"id":"https://openalex.org/W4388145644","doi":"https://doi.org/10.1109/access.2023.3329435","title":"Enhancing Semantically Masked Transformer With Local Attention for Semantic Segmentation","display_name":"Enhancing Semantically Masked Transformer With Local Attention for Semantic Segmentation","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4388145644","doi":"https://doi.org/10.1109/access.2023.3329435"},"language":"en","primary_location":{"id":"doi:10.1109/access.2023.3329435","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3329435","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10304180.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10304180.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091239059","display_name":"Zhengyu Xia","orcid":"https://orcid.org/0000-0001-5225-5580"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhengyu Xia","raw_affiliation_strings":["Illinois Institute of Technology, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, Chicago, IL, USA","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076689613","display_name":"Joohee Kim","orcid":"https://orcid.org/0000-0001-8833-0319"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Joohee Kim","raw_affiliation_strings":["Illinois Institute of Technology, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Illinois Institute of Technology, Chicago, IL, USA","institution_ids":["https://openalex.org/I180949307"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5091239059"],"corresponding_institution_ids":["https://openalex.org/I180949307"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.7336,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.73436459,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"11","issue":null,"first_page":"122345","last_page":"122356"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8260448575019836},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7876071929931641},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.675692081451416},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6532288789749146},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6384851336479187},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.5549081563949585},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4748659133911133},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.46680524945259094},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46282440423965454},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41057533025741577}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8260448575019836},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7876071929931641},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.675692081451416},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6532288789749146},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6384851336479187},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.5549081563949585},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4748659133911133},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.46680524945259094},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46282440423965454},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41057533025741577},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2023.3329435","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3329435","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10304180.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:531bdfe54bb04fd2a2d9650705b4a73d","is_oa":true,"landing_page_url":"https://doaj.org/article/531bdfe54bb04fd2a2d9650705b4a73d","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 11, Pp 122345-122356 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2023.3329435","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2023.3329435","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10304180.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.75,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[{"id":"https://openalex.org/G5729426267","display_name":null,"funder_award_id":"1415181272","funder_id":"https://openalex.org/F4320321681","funder_display_name":"Ministry of Trade, Industry and Energy"},{"id":"https://openalex.org/G992484961","display_name":null,"funder_award_id":"Korea","funder_id":"https://openalex.org/F4320321681","funder_display_name":"Ministry of Trade, Industry and Energy"}],"funders":[{"id":"https://openalex.org/F4320309321","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44"},{"id":"https://openalex.org/F4320315121","display_name":"Samsung Advanced Institute of Technology","ror":null},{"id":"https://openalex.org/F4320321314","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96"},{"id":"https://openalex.org/F4320321370","display_name":"Inha University","ror":"https://ror.org/01easw929"},{"id":"https://openalex.org/F4320321681","display_name":"Ministry of Trade, Industry and Energy","ror":"https://ror.org/008nkqk13"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4388145644.pdf","grobid_xml":"https://content.openalex.org/works/W4388145644.grobid-xml"},"referenced_works_count":68,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1861492603","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2037227137","https://openalex.org/W2102605133","https://openalex.org/W2109255472","https://openalex.org/W2117539524","https://openalex.org/W2194775991","https://openalex.org/W2340897893","https://openalex.org/W2412782625","https://openalex.org/W2531409750","https://openalex.org/W2560023338","https://openalex.org/W2630837129","https://openalex.org/W2737258237","https://openalex.org/W2799213142","https://openalex.org/W2895340641","https://openalex.org/W2899663614","https://openalex.org/W2901710089","https://openalex.org/W2908510526","https://openalex.org/W2910628332","https://openalex.org/W2955058313","https://openalex.org/W2963727650","https://openalex.org/W2963840672","https://openalex.org/W2963881378","https://openalex.org/W2981689412","https://openalex.org/W3096609285","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3165745140","https://openalex.org/W3170841864","https://openalex.org/W3170874841","https://openalex.org/W3172509117","https://openalex.org/W3175515048","https://openalex.org/W3175544090","https://openalex.org/W3176659256","https://openalex.org/W3211490618","https://openalex.org/W3213165621","https://openalex.org/W4214493665","https://openalex.org/W4214669216","https://openalex.org/W4214893857","https://openalex.org/W4226213006","https://openalex.org/W4293680532","https://openalex.org/W4295312788","https://openalex.org/W4296544717","https://openalex.org/W4312349930","https://openalex.org/W4312443924","https://openalex.org/W4312815172","https://openalex.org/W4312950730","https://openalex.org/W4385245566","https://openalex.org/W6639102338","https://openalex.org/W6639824700","https://openalex.org/W6687483927","https://openalex.org/W6696085341","https://openalex.org/W6739696289","https://openalex.org/W6739901393","https://openalex.org/W6755977528","https://openalex.org/W6757817989","https://openalex.org/W6766978945","https://openalex.org/W6788135285","https://openalex.org/W6797399245","https://openalex.org/W6797790494","https://openalex.org/W6798047393","https://openalex.org/W6798837711","https://openalex.org/W6803677459","https://openalex.org/W6811016991","https://openalex.org/W6842806116"],"related_works":["https://openalex.org/W2185902295","https://openalex.org/W2103507220","https://openalex.org/W3144569342","https://openalex.org/W2945274617","https://openalex.org/W4313052709","https://openalex.org/W4205800335","https://openalex.org/W2055202857","https://openalex.org/W2022929107","https://openalex.org/W80586315","https://openalex.org/W2758994127"],"abstract_inverted_index":{"Transformer-based":[0,125],"semantic":[1,31,39,58,64,117,130,159],"segmentation":[2,49,77,126,170,176,188],"has":[3,94],"been":[4],"applied":[5],"to":[6,47,61,97,140,156,166],"various":[7],"visual":[8],"recognition":[9],"applications":[10],"and":[11,27,74,93,193,214],"achieved":[12],"outstanding":[13],"performance":[14,206],"in":[15,37],"recent":[16],"years.":[17],"Since":[18],"most":[19],"of":[20,67,82,91,123,133,151,177],"these":[21],"approaches":[22],"adopt":[23],"a":[24,57,115,124,152],"pretrained":[25],"backbone":[26,155],"finetune":[28],"it":[29],"for":[30,106,173],"segmentation,":[32],"they":[33],"are":[34,104],"not":[35],"efficient":[36],"capturing":[38],"contextual":[40,65,160],"information":[41,66,161],"during":[42,70],"the":[43,63,71,76,80,88,100,120,163,168,208,215],"encoding":[44,72],"stage,":[45],"leading":[46],"sub-optimal":[48],"performance.":[50,78],"To":[51],"address":[52],"this":[53,111],"problem,":[54],"SeMask":[55,83],"proposes":[56],"attention":[59,89],"operation":[60],"incorporate":[62],"an":[68],"image":[69],"stage":[73],"improves":[75],"However,":[79],"architecture":[81],"is":[84,146],"entirely":[85],"based":[86],"on":[87,162,207],"mechanisms":[90],"Transformers":[92],"some":[95],"limitations":[96],"fully":[98],"exploit":[99],"local":[101,143],"details,":[102],"which":[103],"important":[105],"more":[107,174],"accurate":[108,175],"segmentation.":[109],"In":[110],"paper,":[112],"we":[113],"introduce":[114],"novel":[116],"layer":[118,131],"into":[119],"encoder":[121,164],"side":[122,165],"model.":[127],"The":[128],"proposed":[129,181,201],"consists":[132],"depthwise":[134],"convolutions":[135],"with":[136,186,211,218],"different":[137,149],"kernel":[138],"sizes":[139],"capture":[141],"multi-scale":[142,158],"details.":[144],"It":[145],"integrated":[147,185],"at":[148],"stages":[150],"hierarchical":[153],"Transformer":[154],"acquire":[157],"improve":[167],"overall":[169],"performance,":[171],"especially":[172],"small":[178],"objects.":[179],"Our":[180],"method":[182,202],"can":[183,203],"be":[184],"common":[187],"models":[189],"such":[190],"as":[191],"Semantic-FPN":[192],"Mask":[194],"Transformers.":[195],"Experimental":[196],"results":[197],"show":[198],"that":[199],"our":[200],"achieve":[204],"state-of-the-art":[205],"ADE20K":[209],"dataset":[210,217],"58.24%":[212],"mIoU":[213],"Cityscapes":[216],"84.97%":[219],"mIoU.":[220]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
