{"id":"https://openalex.org/W7106036877","doi":"https://doi.org/10.1109/lgrs.2025.3634729","title":"Strip-ViTAE: A Direction-Aware Transformer With Enhanced Feature Modeling for Remote Sensing Image Object Detection","display_name":"Strip-ViTAE: A Direction-Aware Transformer With Enhanced Feature Modeling for Remote Sensing Image Object Detection","publication_year":2025,"publication_date":"2025-11-19","ids":{"openalex":"https://openalex.org/W7106036877","doi":"https://doi.org/10.1109/lgrs.2025.3634729"},"language":null,"primary_location":{"id":"doi:10.1109/lgrs.2025.3634729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2025.3634729","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Minqi Lin","orcid":"https://orcid.org/0009-0009-3013-9453"},"institutions":[{"id":"https://openalex.org/I4210115570","display_name":"National Space Science Center","ror":"https://ror.org/02nnjtm50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210115570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Minqi Lin","raw_affiliation_strings":["Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China","institution_ids":["https://openalex.org/I4210115570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hongzhen Chen","orcid":"https://orcid.org/0000-0002-0181-9742"},"institutions":[{"id":"https://openalex.org/I4210115570","display_name":"National Space Science Center","ror":"https://ror.org/02nnjtm50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210115570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongzhen Chen","raw_affiliation_strings":["Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China","institution_ids":["https://openalex.org/I4210115570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chenzheng Li","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115570","display_name":"National Space Science Center","ror":"https://ror.org/02nnjtm50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210115570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenzheng Li","raw_affiliation_strings":["Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China","institution_ids":["https://openalex.org/I4210115570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Guangyuan Liu","orcid":"https://orcid.org/0000-0003-2725-0918"},"institutions":[{"id":"https://openalex.org/I4210115570","display_name":"National Space Science Center","ror":"https://ror.org/02nnjtm50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210115570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangyuan Liu","raw_affiliation_strings":["Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China","institution_ids":["https://openalex.org/I4210115570"]}]},{"author_position":"last","author":{"id":null,"display_name":"Chunjiang Bian","orcid":"https://orcid.org/0000-0003-4867-0137"},"institutions":[{"id":"https://openalex.org/I4210115570","display_name":"National Space Science Center","ror":"https://ror.org/02nnjtm50","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210115570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunjiang Bian","raw_affiliation_strings":["Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Key Laboratory of Electronics and Information Technology for Space Systems, National Space Science Center, Beijing, China","institution_ids":["https://openalex.org/I4210115570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210115570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.58047847,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"23","issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.6297000050544739,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.6297000050544739,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.13009999692440033,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.08900000154972076,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6137999892234802},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5508000254631042},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5354999899864197},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.46399998664855957},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.46230000257492065},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.43130001425743103},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.427700012922287},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.39169999957084656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7476999759674072},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6518999934196472},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6137999892234802},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.558899998664856},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5508000254631042},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5354999899864197},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.46399998664855957},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.43130001425743103},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.427700012922287},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.39169999957084656},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37869998812675476},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.3610999882221222},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.33410000801086426},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.3181000053882599},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.30390000343322754},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.2892000079154968},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.27090001106262207}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lgrs.2025.3634729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2025.3634729","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2962749812","https://openalex.org/W2963849369","https://openalex.org/W2964979676","https://openalex.org/W2966926453","https://openalex.org/W3170033848","https://openalex.org/W3174873843","https://openalex.org/W4210925408","https://openalex.org/W4214648418","https://openalex.org/W4311187017","https://openalex.org/W4312335509","https://openalex.org/W4312446817","https://openalex.org/W4312795296","https://openalex.org/W4312804579","https://openalex.org/W4387801831","https://openalex.org/W4390873076","https://openalex.org/W4401992000","https://openalex.org/W4402352155","https://openalex.org/W4402667905","https://openalex.org/W4404914866","https://openalex.org/W4406171817"],"related_works":[],"abstract_inverted_index":{"Recently,":[0],"ViTAE-RVSA,":[1],"the":[2,14,46,75,100,148,158,165,175],"first":[3],"large-scale":[4],"Vision":[5],"Transformer":[6],"(ViT)":[7],"tailored":[8],"for":[9,51,108,167],"remote":[10],"sensing,":[11],"has":[12],"demonstrated":[13],"potential":[15],"of":[16,123,177],"ViTs":[17],"by":[18,161,172],"integrating":[19],"window":[20],"attention":[21],"with":[22],"a":[23,65,70,85,116,124,130,136],"convolutional":[24],"branch.":[25],"However,":[26],"as":[27],"this":[28],"branch":[29],"still":[30],"adopts":[31],"isotropic":[32],"square":[33],"kernels":[34,96],"and":[35,55,93,103,110,135,163,169],"conventional":[36],"Feature":[37,118],"Pyramid":[38,119],"Networks":[39],"neglect":[40],"directional":[41],"priors":[42],"in":[43,74],"multi-scale":[44],"fusion,":[45],"resulting":[47],"representations":[48],"remain":[49],"suboptimal":[50],"arbitrarily":[52],"oriented,":[53],"high-aspect-ratio,":[54],"small":[56,111,170],"objects.":[57,112],"To":[58],"overcome":[59],"these":[60],"limitations,":[61],"we":[62,83,114],"propose":[63],"Strip-ViTAE,":[64],"transformer-based":[66],"detector":[67],"that":[68,152],"embeds":[69],"rotation-equivariant":[71],"convolution":[72],"(R2Conv)":[73],"backbone":[76],"to":[77,97,141],"capture":[78],"orientation-consistent":[79],"local":[80,105],"features.":[81],"Moreover,":[82],"introduce":[84],"Parallel":[86],"Strip":[87,117],"Convolution":[88],"Module":[89,127,133,139],"(PSCM)":[90],"employing":[91],"horizontal":[92],"vertical":[94],"strip":[95],"adaptively":[98],"enlarge":[99],"receptive":[101],"field":[102],"strengthen":[104],"feature":[106],"modeling":[107],"elongated":[109],"Finally,":[113],"design":[115],"Network":[120],"(StripFPN)":[121],"composed":[122],"Bottom-Up":[125],"Reflow":[126],"(Bottom-Up":[128],"RM),":[129],"Strip-Based":[131],"Enhancement":[132],"(SBEM),":[134],"Self-Attention":[137],"Excitation":[138],"(SAEM)":[140],"achieve":[142],"direction-consistent":[143],"cross-scale":[144],"fusion.":[145],"Experiments":[146],"on":[147],"DOTA-v1.5":[149],"dataset":[150],"show":[151],"Strip-ViTAE":[153],"attains":[154],"72.82%":[155],"mAP,":[156],"surpassing":[157],"state-of-the-art":[159],"(SOTA)":[160],"1.35%":[162],"improving":[164],"mAP":[166],"high-aspect-ratio":[168],"objects":[171],"3.20%,":[173],"validating":[174],"effectiveness":[176],"our":[178],"method.":[179]},"counts_by_year":[],"updated_date":"2025-12-11T23:09:37.256380","created_date":"2025-11-19T00:00:00"}
