{"id":"https://openalex.org/W7076054171","doi":"https://doi.org/10.1109/tgrs.2025.3599214","title":"AFSIFormer: Adaptive Frequency\u2013Spatial Interaction Attention Mechanism for Aerial Image Semantic Segmentation","display_name":"AFSIFormer: Adaptive Frequency\u2013Spatial Interaction Attention Mechanism for Aerial Image Semantic Segmentation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7076054171","doi":"https://doi.org/10.1109/tgrs.2025.3599214"},"language":"en","primary_location":{"id":"doi:10.1109/tgrs.2025.3599214","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2025.3599214","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jie Hui","orcid":"https://orcid.org/0009-0002-8519-3800"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jie Hui","raw_affiliation_strings":["State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0009-0002-8519-3800","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Wenyu Mi","orcid":"https://orcid.org/0000-0002-4777-5327"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenyu Mi","raw_affiliation_strings":["State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-4777-5327","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jianji Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianji Wang","raw_affiliation_strings":["State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yuanyang Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyang Cao","raw_affiliation_strings":["State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ziyi Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyi Zhou","raw_affiliation_strings":["School of AI and Advanced Computing, Xi&#x2019;an Jiaotong-Liverpool University, Nanjing, Jiangsu, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of AI and Advanced Computing, Xi&#x2019;an Jiaotong-Liverpool University, Nanjing, Jiangsu, China","institution_ids":["https://openalex.org/I69356397"]}]},{"author_position":"last","author":{"id":null,"display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0003-1608-8257","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Human-Machine Hybrid Augmented Intelligence, the National Engineering Research Center for Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":1.1219,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.83801498,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"63","issue":null,"first_page":"1","last_page":"19"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10591","display_name":"Theoretical and Computational Physics","score":0.03849999979138374,"subfield":{"id":"https://openalex.org/subfields/3104","display_name":"Condensed Matter Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10591","display_name":"Theoretical and Computational Physics","score":0.03849999979138374,"subfield":{"id":"https://openalex.org/subfields/3104","display_name":"Condensed Matter Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12613","display_name":"X-ray Diffraction in Crystallography","score":0.02539999969303608,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12579","display_name":"Muon and positron interactions and applications","score":0.021800000220537186,"subfield":{"id":"https://openalex.org/subfields/2211","display_name":"Mechanics of Materials"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5997999906539917},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5080999732017517},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.4765999913215637},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4650000035762787},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4447999894618988},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4413999915122986},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4352000057697296},{"id":"https://openalex.org/keywords/aerial-image","display_name":"Aerial image","score":0.4074999988079071},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.39399999380111694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8356000185012817},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.663100004196167},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5997999906539917},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5080999732017517},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.4765999913215637},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4650000035762787},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4462999999523163},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4447999894618988},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4413999915122986},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4352000057697296},{"id":"https://openalex.org/C2776429412","wikidata":"https://www.wikidata.org/wiki/Q4688011","display_name":"Aerial image","level":3,"score":0.4074999988079071},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.39399999380111694},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3912999927997589},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3686000108718872},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.33399999141693115},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3091000020503998},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.29499998688697815},{"id":"https://openalex.org/C39399123","wikidata":"https://www.wikidata.org/wiki/Q1348989","display_name":"Earth observation","level":3,"score":0.2874999940395355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2851000130176544},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.2847999930381775},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.27880001068115234},{"id":"https://openalex.org/C38764148","wikidata":"https://www.wikidata.org/wiki/Q17098245","display_name":"Interaction information","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C33326189","wikidata":"https://www.wikidata.org/wiki/Q17092450","display_name":"Information integration","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25870001316070557},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgrs.2025.3599214","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2025.3599214","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4373385012149811,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G3833898155","display_name":null,"funder_award_id":"62088102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W1655403841","https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2018342351","https://openalex.org/W2303475025","https://openalex.org/W2560023338","https://openalex.org/W2787091153","https://openalex.org/W2886934227","https://openalex.org/W2890671392","https://openalex.org/W2942454403","https://openalex.org/W2954896312","https://openalex.org/W2955058313","https://openalex.org/W2981689412","https://openalex.org/W3011147769","https://openalex.org/W3034307881","https://openalex.org/W3034552520","https://openalex.org/W3046711384","https://openalex.org/W3047725879","https://openalex.org/W3048631361","https://openalex.org/W3086017879","https://openalex.org/W3109998321","https://openalex.org/W3127751679","https://openalex.org/W3128592650","https://openalex.org/W3129029680","https://openalex.org/W3138516171","https://openalex.org/W3161825146","https://openalex.org/W3180045188","https://openalex.org/W3190334976","https://openalex.org/W3199003182","https://openalex.org/W3202923600","https://openalex.org/W4205138939","https://openalex.org/W4214532801","https://openalex.org/W4214893857","https://openalex.org/W4283450732","https://openalex.org/W4289752563","https://openalex.org/W4290715747","https://openalex.org/W4292826140","https://openalex.org/W4312349930","https://openalex.org/W4318149001","https://openalex.org/W4318586159","https://openalex.org/W4386075524","https://openalex.org/W4386597693","https://openalex.org/W4386634500","https://openalex.org/W4387723088","https://openalex.org/W4388145570","https://openalex.org/W4388532427","https://openalex.org/W4389286635","https://openalex.org/W4389355346","https://openalex.org/W4390607656","https://openalex.org/W4390660187","https://openalex.org/W4390872147","https://openalex.org/W4390873471","https://openalex.org/W4390874070","https://openalex.org/W4391878073","https://openalex.org/W4392523428","https://openalex.org/W4392543906","https://openalex.org/W4392980175","https://openalex.org/W4396534863","https://openalex.org/W4396731180","https://openalex.org/W4399039901","https://openalex.org/W4399618753","https://openalex.org/W4399728165","https://openalex.org/W4400579361","https://openalex.org/W4400727268","https://openalex.org/W4402389514","https://openalex.org/W4402775847","https://openalex.org/W4402863879","https://openalex.org/W4404479613","https://openalex.org/W4404628512","https://openalex.org/W4405845035","https://openalex.org/W4406892479","https://openalex.org/W4407316391","https://openalex.org/W4407451533","https://openalex.org/W4409225836","https://openalex.org/W4410050224"],"related_works":[],"abstract_inverted_index":{"Aerial":[0],"image":[1,224],"semantic":[2],"segmentation":[3,225],"continues":[4],"to":[5,117,144],"face":[6],"significant":[7],"challenges":[8],"in":[9],"accurately":[10],"capturing":[11],"boundary":[12,36],"textures.":[13],"While":[14],"convolutional":[15,193],"neural":[16],"networks":[17],"(CNNs)":[18],"and":[19,27,50,105,128,168,173,200],"transformers":[20],"are":[21,107],"effective":[22],"at":[23,231],"modeling":[24,99],"local":[25,85,98],"features":[26],"long-range":[28,79],"contextual":[29,91,119],"dependencies,":[30],"they":[31],"often":[32],"struggle":[33],"with":[34,158],"fine-grained":[35,97],"representation.":[37],"In":[38,53],"contrast,":[39],"frequency-domain":[40,147,201],"information":[41,92,120],"offers":[42],"complementary":[43],"advantages":[44],"by":[45],"effectively":[46],"representing":[47],"periodic":[48],"textures":[49],"structural":[51],"edges.":[52],"this":[54,134],"article,":[55],"we":[56,177],"propose":[57],"a":[58,67,72,84,137,179,188],"novel":[59],"adaptive":[60,112],"frequency\u2013spatial":[61,113,211],"interaction":[62,114],"transformer":[63],"(AFSIFormer)":[64],"that":[65,184],"follows":[66],"progressive":[68],"learning":[69,167],"strategy.":[70],"First,":[71],"boundary-aware":[73],"directional":[74],"attention":[75,87,115,151,160],"mechanism":[76,88,135],"(BADAM)":[77],"captures":[78],"dependencies":[80],"across":[81,121],"windows.":[82,123],"Then,":[83],"window":[86],"(LWAM)":[89],"refines":[90],"within":[93,191],"each":[94,150,192],"window,":[95],"enabling":[96],"under":[100],"global":[101,199],"guidance.":[102],"Both":[103],"BADAM":[104],"LWAM":[106],"built":[108],"upon":[109],"our":[110],"designed":[111],"(AFSIAttention)":[116],"capture":[118],"different":[122],"Unlike":[124],"the":[125,204,209,216],"existing":[126],"frequency-":[127],"spatial-domain":[129],"external":[130],"coarse":[131],"integration":[132,170],"strategies,":[133],"utilizes":[136],"head-specific":[138],"lightweight":[139],"frequency":[140,154,172],"projection":[141],"network":[142,212],"(HS-LFPN)":[143],"dynamically":[145],"generate":[146],"weights":[148,155],"for":[149],"head.":[152],"These":[153,206],"interact":[156],"adaptively":[157],"spatial":[159,165,174],"(SpatAttn)":[161],"weights,":[162],"facilitating":[163],"frequency-guided":[164],"feature":[166],"internal":[169],"of":[171,198],"information.":[175],"Furthermore,":[176],"design":[178],"block-level":[180],"residual":[181,189],"coupling":[182],"architecture":[183],"embeds":[185],"AFSIFormer":[186],"as":[187],"module":[190],"stage,":[194],"allowing":[195],"continuous":[196],"infusion":[197],"cues":[202],"throughout":[203],"network.":[205],"collectively":[207],"constitute":[208],"synergistic":[210],"(SynFSNet),":[213],"which":[214],"achieves":[215],"state-of-the-art":[217],"(SOTA)":[218],"performance":[219],"on":[220],"three":[221],"benchmark":[222],"aerial":[223],"datasets.":[226],"The":[227],"code":[228],"is":[229],"available":[230],"<uri":[232],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[233],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/Xinmu-Tantai/SynFSNet</uri>":[234]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
