{"id":"https://openalex.org/W4399435719","doi":"https://doi.org/10.1145/3652583.3658006","title":"SFAM: Lightweight Spectrum Unreferenced Attention Network","display_name":"SFAM: Lightweight Spectrum Unreferenced Attention Network","publication_year":2024,"publication_date":"2024-05-30","ids":{"openalex":"https://openalex.org/W4399435719","doi":"https://doi.org/10.1145/3652583.3658006"},"language":"en","primary_location":{"id":"doi:10.1145/3652583.3658006","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658006","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658006","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658006","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Xuanhao Qi","orcid":"https://orcid.org/0009-0001-4332-7930"},"institutions":[{"id":"https://openalex.org/I22046295","display_name":"Inner Mongolia Normal University","ror":"https://ror.org/0497ase59","country_code":"CN","type":"education","lineage":["https://openalex.org/I22046295"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuanhao Qi","raw_affiliation_strings":["College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China"],"raw_orcid":"https://orcid.org/0009-0001-4332-7930","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China","institution_ids":["https://openalex.org/I22046295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056958899","display_name":"Min Zhi","orcid":"https://orcid.org/0009-0001-3069-8628"},"institutions":[{"id":"https://openalex.org/I22046295","display_name":"Inner Mongolia Normal University","ror":"https://ror.org/0497ase59","country_code":"CN","type":"education","lineage":["https://openalex.org/I22046295"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Zhi","raw_affiliation_strings":["College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China"],"raw_orcid":"https://orcid.org/0009-0001-3069-8628","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China","institution_ids":["https://openalex.org/I22046295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039488408","display_name":"Yanjun Yin","orcid":"https://orcid.org/0009-0009-0758-1016"},"institutions":[{"id":"https://openalex.org/I22046295","display_name":"Inner Mongolia Normal University","ror":"https://ror.org/0497ase59","country_code":"CN","type":"education","lineage":["https://openalex.org/I22046295"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjun Yin","raw_affiliation_strings":["College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China"],"raw_orcid":"https://orcid.org/0009-0009-0758-1016","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China","institution_ids":["https://openalex.org/I22046295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102831832","display_name":"Ping Ping","orcid":"https://orcid.org/0009-0007-6597-1165"},"institutions":[{"id":"https://openalex.org/I22046295","display_name":"Inner Mongolia Normal University","ror":"https://ror.org/0497ase59","country_code":"CN","type":"education","lineage":["https://openalex.org/I22046295"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Ping","raw_affiliation_strings":["College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China"],"raw_orcid":"https://orcid.org/0009-0007-6597-1165","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China","institution_ids":["https://openalex.org/I22046295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045346321","display_name":"Y. Zhang","orcid":"https://orcid.org/0009-0008-6317-1743"},"institutions":[{"id":"https://openalex.org/I22046295","display_name":"Inner Mongolia Normal University","ror":"https://ror.org/0497ase59","country_code":"CN","type":"education","lineage":["https://openalex.org/I22046295"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuening Zhang","raw_affiliation_strings":["College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China"],"raw_orcid":"https://orcid.org/0009-0008-6317-1743","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Inner Mongolia Normal University, Hohhot, China","institution_ids":["https://openalex.org/I22046295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I22046295"],"apc_list":null,"apc_paid":null,"fwci":0.4762,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.61398926,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"749","last_page":"757"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6905329823493958},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6474617123603821},{"id":"https://openalex.org/keywords/discrete-cosine-transform","display_name":"Discrete cosine transform","score":0.6430140733718872},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5886214971542358},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5858244299888611},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.5029889941215515},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4704011380672455},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4636138081550598},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4635355472564697},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4228053092956543},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3905634880065918},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2991759777069092},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.2866009473800659},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1014244556427002}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6905329823493958},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6474617123603821},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.6430140733718872},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5886214971542358},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5858244299888611},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.5029889941215515},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4704011380672455},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4636138081550598},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4635355472564697},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4228053092956543},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3905634880065918},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2991759777069092},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2866009473800659},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1014244556427002},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3652583.3658006","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658006","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658006","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3652583.3658006","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658006","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658006","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4399435719.pdf"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W2031614119","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2752782242","https://openalex.org/W2797514659","https://openalex.org/W2963125010","https://openalex.org/W3034429256","https://openalex.org/W3121523901","https://openalex.org/W3131500599","https://openalex.org/W3133696297","https://openalex.org/W3138516171","https://openalex.org/W4214493665","https://openalex.org/W4214709605","https://openalex.org/W4312820606","https://openalex.org/W4313007769","https://openalex.org/W6790690058"],"related_works":["https://openalex.org/W1916685473","https://openalex.org/W2055682261","https://openalex.org/W1993363272","https://openalex.org/W2186390138","https://openalex.org/W2060035984","https://openalex.org/W2790129917","https://openalex.org/W2992856432","https://openalex.org/W2100638064","https://openalex.org/W2127787376","https://openalex.org/W2534655758"],"abstract_inverted_index":{"The":[0,70,88,103,142,154,207,254],"construction":[1],"of":[2,11,23,30,44,80,96,170,181,187,218,246,256],"deep":[3],"neural":[4],"networks":[5],"depends":[6],"on":[7,220,225,233],"a":[8,18,50,57,64,157],"significant":[9],"number":[10,180,245,255],"parameters":[12,257],"and":[13,37,63,72,131,138,161,231,241,252,263,267],"computational":[14],"complexity,":[15],"which":[16],"poses":[17],"challenge":[19],"in":[20,85,150,173,190],"the":[21,28,31,45,78,81,86,94,97,106,113,116,120,127,136,147,151,174,179,185,191,203,212,221,226,234,244],"field":[22],"image":[24,114,129],"processing.":[25],"To":[26],"address":[27],"issue":[29],"Transformer":[32,53],"network":[33,204],"model's":[34,205],"large":[35],"size":[36],"inability":[38],"to":[39,76,92,111,119,145,166,200,238],"effectively":[40],"capture":[41],"local":[42,171,188],"features":[43,83,149,169,189],"image,":[46],"this":[47],"paper":[48],"proposes":[49],"lightweight":[51],"composite":[52],"structure":[54,90,130],"that":[55,211],"combines":[56],"spectral":[58,82],"feature":[59,133],"refinement":[60],"module":[61,68],"(SFRM)":[62],"parameterless":[65],"attention":[66,163],"augmentation":[67],"(PAAM).":[69],"SFRM":[71,104],"PAAM":[73,155],"work":[74],"together":[75],"improve":[77],"quality":[79],"used":[84],"transformer.":[87],"proposed":[89,213],"aims":[91],"enhance":[93],"performance":[95],"transformer":[98],"without":[99,177],"adding":[100],"unnecessary":[101],"complexity.":[102],"utilises":[105],"two-dimensional":[107],"discrete":[108],"cosine":[109],"transform":[110],"convert":[112],"from":[115,135],"spatial":[117,175],"domain":[118,176],"frequency":[121],"domain.":[122],"This":[123,183],"process":[124],"extracts":[125],"both":[126],"overall":[128],"detailed":[132],"information":[134,172],"high-frequency":[137],"low-frequency":[139],"regions,":[140],"respectively.":[141,269],"aim":[143],"is":[144,198,258],"purify":[146],"spatially-insignificant":[148],"original":[152],"image.":[153,192],"introduces":[156],"parameter-free":[158],"channel,":[159],"spatial,":[160],"3D":[162],"enhancement":[164],"mechanism":[165],"extract":[167],"correlation":[168],"increasing":[178],"parameters.":[182],"improves":[184],"expression":[186],"Additionally,":[193],"Depth":[194],"Separable":[195],"(DConv":[196],"MLP)":[197],"introduced":[199],"further":[201],"reduce":[202],"weight.":[206],"experimental":[208],"results":[209],"show":[210],"algorithm":[214],"achieves":[215],"an":[216],"accuracy":[217],"79.6%":[219],"ImageNet-1K":[222],"dataset,":[223],"91.6%":[224],"Oxford":[227],"102":[228],"Flower":[229],"Dataset,":[230],"94.1%":[232],"CIFAR-10":[235],"dataset.":[236],"Compared":[237],"ViT-B,":[239],"Swin-T,":[240],"CSwin-T,":[242],"respectively,":[243],"covariates":[247],"decreases":[248],"by":[249,265],"86.11%,":[250],"58.62%,":[251],"47.83%.":[253],"also":[259],"lower":[260],"than":[261],"VGG-16":[262],"ResNet-110":[264],"91.07%":[266],"77.70%,":[268]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
