{"id":"https://openalex.org/W4383220186","doi":"https://doi.org/10.1109/tgrs.2023.3292418","title":"Efficient Inductive Vision Transformer for Oriented Object Detection in Remote Sensing Imagery","display_name":"Efficient Inductive Vision Transformer for Oriented Object Detection in Remote Sensing Imagery","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4383220186","doi":"https://doi.org/10.1109/tgrs.2023.3292418"},"language":"en","primary_location":{"id":"doi:10.1109/tgrs.2023.3292418","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3292418","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101776528","display_name":"Cong Zhang","orcid":"https://orcid.org/0000-0003-2745-1656"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Cong Zhang","raw_affiliation_strings":["Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072056125","display_name":"Jingran Su","orcid":"https://orcid.org/0000-0002-9873-1770"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jingran Su","raw_affiliation_strings":["Department of Computing, The Hong Kong Polytechnic University, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computing, The Hong Kong Polytechnic University, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086183661","display_name":"Yakun Ju","orcid":"https://orcid.org/0000-0003-4065-4108"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yakun Ju","raw_affiliation_strings":["Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019678322","display_name":"Kin\u2010Man Lam","orcid":"https://orcid.org/0000-0002-0422-8454"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Kin-Man Lam","raw_affiliation_strings":["Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Electronic and Information Engineering, The Hong Kong Polytechnic University, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100341321","display_name":"Qi Wang","orcid":"https://orcid.org/0000-0002-7028-4956"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Wang","raw_affiliation_strings":["School of Artificial Intelligence, Optics and Electronics, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Optics and Electronics, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101776528"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":17.4252,"has_fulltext":false,"cited_by_count":110,"citation_normalized_percentile":{"value":0.99442666,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"61","issue":null,"first_page":"1","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8246523141860962},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5670909285545349},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5567196607589722},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4853443205356598},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48339739441871643},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.48191526532173157},{"id":"https://openalex.org/keywords/remote-sensing-application","display_name":"Remote sensing application","score":0.428529292345047},{"id":"https://openalex.org/keywords/inductive-bias","display_name":"Inductive bias","score":0.4129106402397156},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2727915942668915},{"id":"https://openalex.org/keywords/hyperspectral-imaging","display_name":"Hyperspectral imaging","score":0.25419604778289795},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.2473912239074707},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.13356590270996094},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.10033464431762695}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8246523141860962},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5670909285545349},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5567196607589722},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4853443205356598},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48339739441871643},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.48191526532173157},{"id":"https://openalex.org/C183365957","wikidata":"https://www.wikidata.org/wiki/Q17140402","display_name":"Remote sensing application","level":3,"score":0.428529292345047},{"id":"https://openalex.org/C197352929","wikidata":"https://www.wikidata.org/wiki/Q1074074","display_name":"Inductive bias","level":4,"score":0.4129106402397156},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2727915942668915},{"id":"https://openalex.org/C159078339","wikidata":"https://www.wikidata.org/wiki/Q959005","display_name":"Hyperspectral imaging","level":2,"score":0.25419604778289795},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.2473912239074707},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.13356590270996094},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.10033464431762695},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgrs.2023.3292418","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3292418","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":117,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1861492603","https://openalex.org/W2017448754","https://openalex.org/W2037227137","https://openalex.org/W2059497048","https://openalex.org/W2085625911","https://openalex.org/W2100503224","https://openalex.org/W2102605133","https://openalex.org/W2118246710","https://openalex.org/W2194775991","https://openalex.org/W2400429454","https://openalex.org/W2412588858","https://openalex.org/W2547875792","https://openalex.org/W2549139847","https://openalex.org/W2565639579","https://openalex.org/W2597117158","https://openalex.org/W2884275291","https://openalex.org/W2884751099","https://openalex.org/W2896457183","https://openalex.org/W2908510526","https://openalex.org/W2935079508","https://openalex.org/W2941769495","https://openalex.org/W2949058942","https://openalex.org/W2962749812","https://openalex.org/W2962858109","https://openalex.org/W2963037989","https://openalex.org/W2963351448","https://openalex.org/W2963504571","https://openalex.org/W2964979676","https://openalex.org/W2967487473","https://openalex.org/W2973030851","https://openalex.org/W2991359031","https://openalex.org/W2991363140","https://openalex.org/W2995801068","https://openalex.org/W3015331846","https://openalex.org/W3022917557","https://openalex.org/W3030520226","https://openalex.org/W3035422918","https://openalex.org/W3035678286","https://openalex.org/W3046174881","https://openalex.org/W3092088889","https://openalex.org/W3092462694","https://openalex.org/W3109632933","https://openalex.org/W3121842289","https://openalex.org/W3131500599","https://openalex.org/W3133696297","https://openalex.org/W3136761610","https://openalex.org/W3137278571","https://openalex.org/W3138516171","https://openalex.org/W3140922383","https://openalex.org/W3156315514","https://openalex.org/W3157528469","https://openalex.org/W3160694286","https://openalex.org/W3170841864","https://openalex.org/W3170874841","https://openalex.org/W3174873843","https://openalex.org/W3175227919","https://openalex.org/W3176495987","https://openalex.org/W3180045188","https://openalex.org/W3183129439","https://openalex.org/W3186596917","https://openalex.org/W3193551430","https://openalex.org/W3195858154","https://openalex.org/W3200975211","https://openalex.org/W3201260569","https://openalex.org/W3201797941","https://openalex.org/W3203608457","https://openalex.org/W3211585026","https://openalex.org/W3213792864","https://openalex.org/W3213833596","https://openalex.org/W3214586131","https://openalex.org/W4205932092","https://openalex.org/W4207055281","https://openalex.org/W4210925408","https://openalex.org/W4211114389","https://openalex.org/W4211247672","https://openalex.org/W4213450901","https://openalex.org/W4214493665","https://openalex.org/W4214648418","https://openalex.org/W4214893857","https://openalex.org/W4220837851","https://openalex.org/W4225590475","https://openalex.org/W4225630686","https://openalex.org/W4225742096","https://openalex.org/W4226289601","https://openalex.org/W4226361741","https://openalex.org/W4285189202","https://openalex.org/W4290715466","https://openalex.org/W4292971347","https://openalex.org/W4294643360","https://openalex.org/W4294982749","https://openalex.org/W4297775537","https://openalex.org/W4312350143","https://openalex.org/W4312373555","https://openalex.org/W4312711220","https://openalex.org/W4312735552","https://openalex.org/W4312849330","https://openalex.org/W4313039766","https://openalex.org/W4313525589","https://openalex.org/W4319878798","https://openalex.org/W4385245566","https://openalex.org/W6639102338","https://openalex.org/W6729448088","https://openalex.org/W6737664043","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6757817989","https://openalex.org/W6778485988","https://openalex.org/W6784094891","https://openalex.org/W6788135285","https://openalex.org/W6790690058","https://openalex.org/W6794345597","https://openalex.org/W6797235774","https://openalex.org/W6803650990","https://openalex.org/W6803695728","https://openalex.org/W6841254037"],"related_works":["https://openalex.org/W1810370127","https://openalex.org/W4293226380","https://openalex.org/W1594946127","https://openalex.org/W4312273141","https://openalex.org/W4310274968","https://openalex.org/W3040224948","https://openalex.org/W4313906399","https://openalex.org/W1587378402","https://openalex.org/W4321487865","https://openalex.org/W2969228573"],"abstract_inverted_index":{"Object":[0],"detection":[1,130,269],"is":[2,29,125,156,165,204,217],"a":[3,56,118],"fundamental":[4],"task":[5,74],"in":[6,72,103,115,131,152,171,210,232,245,270],"remote":[7,15,76,88,132,153,233,271],"sensing":[8,16,77,89,133,154,234,272],"image":[9],"analysis":[10],"and":[11,68,100,143,159,195,201,224,264],"scene":[12],"understanding.":[13],"Previous":[14],"object":[17,78,129,249,268],"detectors":[18],"are":[19,199,243],"typically":[20],"based":[21],"on":[22,255],"convolutional":[23],"neural":[24],"networks":[25],"(CNNs),":[26],"whose":[27],"performance":[28,69],"significantly":[30],"limited":[31],"by":[32,95],"the":[33,52,66,73,138,177,182,221,239],"intrinsic":[34],"locality":[35],"of":[36,41,70,75,97,108,226],"convolution":[37],"operations.":[38],"The":[39],"emergence":[40],"vision":[42,122],"Transformers":[43,71],"brings":[44],"potential":[45],"solutions":[46],"to":[47,54,59,167,206,219],"this":[48,116,237],"problem,":[49],"which":[50,173],"have":[51,260],"capability":[53],"be":[55],"solid":[57],"alternative":[58],"CNNs.":[60],"However,":[61],"three":[62,241],"crucial":[63],"obstacles":[64],"hinder":[65],"application":[67],"detection,":[79],"i.e.,":[80],"1)":[81,149],"high":[82],"computational":[83,178],"complexity,":[84],"especially":[85],"for":[86,127,229,266],"high-resolution":[87],"images,":[90],"2)":[91,184],"training-and":[92],"sample-inefficiency":[93],"caused":[94],"lack":[96],"inductive":[98,121,208],"bias,":[99],"3)":[101,212],"difficulty":[102],"learning":[104,225],"arbitrary":[105],"orientation":[106],"knowledge":[107,228],"geospatial":[109],"objects.":[110],"To":[111],"address":[112],"these":[113],"issues,":[114],"paper,":[117],"novel":[119],"efficient":[120],"Transformer":[123],"framework":[124,136],"proposed":[126,166,205,218],"oriented":[128,230,267],"imagery.":[134],"This":[135],"follows":[137],"hierarchical":[139],"feature":[140],"pyramid":[141],"structure":[142],"makes":[144],"threefold":[145],"contributions,":[146],"as":[147],"follows.":[148],"Spatial":[150],"redundancy":[151],"images":[155],"fully":[157],"explored":[158],"an":[160,246],"adaptive":[161],"multi-grained":[162],"routing":[163],"mechanism":[164],"facilitate":[168],"token":[169],"sparsity":[170],"Transformers,":[172],"can":[174],"dramatically":[175],"reduce":[176],"cost":[179],"without":[180],"comprising":[181],"accuracy.":[183],"A":[185],"compact":[186],"dual-path":[187],"encoding":[188],"architecture,":[189],"where":[190],"both":[191],"global":[192],"long-range":[193],"dependencies":[194],"local":[196],"semantic":[197],"relations":[198],"jointly":[200],"complementarily":[202],"captured,":[203],"enhance":[207],"bias":[209],"Transformers.":[211],"An":[213],"angle":[214],"tokenization":[215],"technique":[216],"promote":[220],"encoding,":[222],"embedding,":[223],"direction":[227],"objects":[231],"scenarios.":[235],"In":[236],"work,":[238],"above":[240],"contributions":[242],"instantiated":[244],"advanced":[247],"Transformer-based":[248],"detector,":[250],"namely":[251],"EIA-PVT.":[252],"Comprehensive":[253],"experiments":[254],"two":[256],"publicly":[257],"available":[258],"datasets":[259],"demonstrated":[261],"its":[262],"effectiveness":[263],"superiority":[265],"images.":[273]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":50},{"year":2024,"cited_by_count":48},{"year":2023,"cited_by_count":9}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
