{"id":"https://openalex.org/W4402916037","doi":"https://doi.org/10.1109/icip51287.2024.10648129","title":"Spatial Plaid Attention Decoder for Semantic Segmentation","display_name":"Spatial Plaid Attention Decoder for Semantic Segmentation","publication_year":2024,"publication_date":"2024-09-27","ids":{"openalex":"https://openalex.org/W4402916037","doi":"https://doi.org/10.1109/icip51287.2024.10648129"},"language":"en","primary_location":{"id":"doi:10.1109/icip51287.2024.10648129","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icip51287.2024.10648129","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015224305","display_name":"Abolfazl Meyarian","orcid":null},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abolfazl Meyarian","raw_affiliation_strings":["University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101543726","display_name":"Xiaohui Yuan","orcid":"https://orcid.org/0000-0003-0661-5332"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaohui Yuan","raw_affiliation_strings":["University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033267613","display_name":"Zhinan Qiao","orcid":"https://orcid.org/0000-0002-8103-3829"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhinan Qiao","raw_affiliation_strings":["University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Department of Computer Science and Engineering,Denton,TX,76203","institution_ids":["https://openalex.org/I123534392"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I123534392"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14788981,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"2723","last_page":"2729"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9140999913215637,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9140999913215637,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7638868093490601},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6407027840614319},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5877751111984253},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.36673569679260254},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.35592466592788696},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.34592217206954956},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33027034997940063}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7638868093490601},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6407027840614319},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5877751111984253},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.36673569679260254},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35592466592788696},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34592217206954956},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33027034997940063}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip51287.2024.10648129","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icip51287.2024.10648129","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2125556102","https://openalex.org/W2340897893","https://openalex.org/W2560023338","https://openalex.org/W2565639579","https://openalex.org/W2598666589","https://openalex.org/W2601564443","https://openalex.org/W2737258237","https://openalex.org/W2787091153","https://openalex.org/W2884822772","https://openalex.org/W2963446712","https://openalex.org/W2963604034","https://openalex.org/W2963727650","https://openalex.org/W2963881378","https://openalex.org/W3094502228","https://openalex.org/W3110908156","https://openalex.org/W3113817926","https://openalex.org/W3171398643","https://openalex.org/W3197957534","https://openalex.org/W3211490618","https://openalex.org/W4385245566","https://openalex.org/W4386071839","https://openalex.org/W4386076340","https://openalex.org/W6789041250","https://openalex.org/W6790690058","https://openalex.org/W6797784111","https://openalex.org/W6799041125","https://openalex.org/W6842806116","https://openalex.org/W6842890524"],"related_works":["https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W2501551404","https://openalex.org/W4385583601","https://openalex.org/W4298131179","https://openalex.org/W2113201962","https://openalex.org/W4395685956","https://openalex.org/W2799953226","https://openalex.org/W4398146871","https://openalex.org/W3204400600"],"abstract_inverted_index":{"Striking":[0],"a":[1,8,31,44,86,95,150],"balance":[2],"between":[3],"efficiency":[4],"and":[5,13,25,81,115,120,131],"accuracy":[6],"is":[7,158],"challenge":[9],"in":[10],"the":[11,62,65,77,126,138,156],"design":[12,140],"implementation":[14],"of":[15,68,97,141,155],"decoders.":[16],"Accurate":[17],"decoders":[18],"often":[19],"tend":[20],"to":[21,60,75,145],"be":[22],"highly":[23],"complex":[24],"computationally":[26],"costly.":[27],"This":[28,83],"paper":[29],"presents":[30],"novel":[32],"decoder":[33],"for":[34,89],"semantic":[35],"segmentation:":[36],"Spatial":[37,45],"Plaid":[38,46],"Attention":[39,47],"Decoder":[40],"(SPADe).":[41],"We":[42,134],"propose":[43],"module":[48],"that":[49,137],"performs":[50],"an":[51],"efficient":[52],"local":[53,66],"feature":[54,58,73],"collection":[55],"through":[56],"spatial":[57],"folding":[59],"help":[61],"model":[63],"capture":[64,146],"structure":[67],"objects":[69],"while":[70,124],"using":[71],"long-range":[72,147],"aggregation":[74],"consider":[76],"global":[78],"structures":[79],"efficiently":[80],"accurately.":[82],"makes":[84],"SPADe":[85,102,117,142,157],"suitable":[87],"choice":[88],"applications":[90],"with":[91,106,149],"limited":[92],"resources.":[93],"With":[94],"size":[96],"7.3%":[98],"UPerNet":[99],"decoder,":[100],"our":[101],"obtains":[103,118],"state-of-the-art":[104],"performance":[105],"several":[107],"popular":[108],"backbones":[109],"on":[110],"public":[111],"benchmarks.":[112],"On":[113],"Cityscapes":[114],"ADE20K,":[116],"84.3%":[119],"$53.8":[121],"\\%":[122],"\\mathrm{mIoU}$,":[123],"reducing":[125],"total":[127],"GFlops":[128],"by":[129],"32.8%":[130],"70.5%,":[132],"respectively.":[133],"also":[135],"demonstrate":[136],"effective":[139],"allows":[143],"it":[144],"dependencies":[148],"large":[151],"receptive":[152],"field.":[153],"Implementation":[154],"available":[159],"at":[160],"github/SPADe.":[161]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
