{"id":"https://openalex.org/W4313055764","doi":"https://doi.org/10.1109/igarss46834.2022.9883252","title":"Multi-Scale Interactive Transformer for Remote Sensing Cross-Modal Image-Text Retrieval","display_name":"Multi-Scale Interactive Transformer for Remote Sensing Cross-Modal Image-Text Retrieval","publication_year":2022,"publication_date":"2022-07-17","ids":{"openalex":"https://openalex.org/W4313055764","doi":"https://doi.org/10.1109/igarss46834.2022.9883252"},"language":"en","primary_location":{"id":"doi:10.1109/igarss46834.2022.9883252","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igarss46834.2022.9883252","pdf_url":null,"source":{"id":"https://openalex.org/S4363604196","display_name":"IGARSS 2022 - 2022 IEEE International Geoscience and Remote Sensing Symposium","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IGARSS 2022 - 2022 IEEE International Geoscience and Remote Sensing Symposium","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100780978","display_name":"Yijing Wang","orcid":"https://orcid.org/0000-0002-0862-6564"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yijing Wang","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101449769","display_name":"Jingjing Ma","orcid":"https://orcid.org/0000-0001-7562-4262"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Ma","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012061890","display_name":"Mingteng Li","orcid":"https://orcid.org/0000-0001-8866-0828"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingteng Li","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059262797","display_name":"Xu Tang","orcid":"https://orcid.org/0000-0003-1375-0778"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Tang","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101609203","display_name":"Xiao Han","orcid":"https://orcid.org/0000-0002-1953-8658"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Han","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050630882","display_name":"Licheng Jiao","orcid":"https://orcid.org/0000-0003-3354-9617"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Licheng Jiao","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","Geovis Spatial Technology Co.,Ltd"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University,Xi&#x0027;an,Shaanxi Province,China,710071","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Geovis Spatial Technology Co.,Ltd","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2387,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.8649819,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"839","last_page":"842"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8060240745544434},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7127705812454224},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.7103118896484375},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.568790078163147},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5685498714447021},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5193518400192261},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5061444640159607},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4705629348754883},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4221609830856323},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4173007011413574},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4164566099643707},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09836354851722717}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8060240745544434},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7127705812454224},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.7103118896484375},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.568790078163147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5685498714447021},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5193518400192261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5061444640159607},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4705629348754883},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4221609830856323},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4173007011413574},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4164566099643707},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09836354851722717},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/igarss46834.2022.9883252","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igarss46834.2022.9883252","pdf_url":null,"source":{"id":"https://openalex.org/S4363604196","display_name":"IGARSS 2022 - 2022 IEEE International Geoscience and Remote Sensing Symposium","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IGARSS 2022 - 2022 IEEE International Geoscience and Remote Sensing Symposium","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6800000071525574}],"awards":[{"id":"https://openalex.org/G5324547038","display_name":null,"funder_award_id":"62171332","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1555459384","https://openalex.org/W2131774270","https://openalex.org/W2183341477","https://openalex.org/W2531409750","https://openalex.org/W2774267535","https://openalex.org/W2779054585","https://openalex.org/W2886702754","https://openalex.org/W2896457183","https://openalex.org/W2963840672","https://openalex.org/W3042481550","https://openalex.org/W3100245404","https://openalex.org/W3126792443","https://openalex.org/W3140792177","https://openalex.org/W3165084071","https://openalex.org/W3208803664","https://openalex.org/W4205723298","https://openalex.org/W4385245566","https://openalex.org/W6696085341","https://openalex.org/W6728184133","https://openalex.org/W6755207826","https://openalex.org/W6789753369","https://openalex.org/W6796339025","https://openalex.org/W6802704712"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2142795561","https://openalex.org/W4205302943","https://openalex.org/W2561132942","https://openalex.org/W3155418658","https://openalex.org/W4243199227","https://openalex.org/W2379948177","https://openalex.org/W4309346246"],"abstract_inverted_index":{"Cross-modal":[0],"Remote":[1],"sensing":[2],"(RS)":[3],"image-text":[4],"retrieval":[5,178],"(CMR-SITR)":[6],"plays":[7],"a":[8,88,140],"crucial":[9],"role":[10],"in":[11,35,62,93],"the":[12,36,45,69,82,116,133,160,177],"RS":[13,25,111,154,169,186],"community.":[14],"A":[15],"common":[16,39],"way":[17],"for":[18,91,108,166,193],"CMRSITR":[19,92],"is":[20,119,146,191],"to":[21,127,148,175],"extract":[22],"texts":[23,109,167],"and":[24,30,59,75,110,168],"images'":[26],"feature":[27,40,105,143],"representations":[28],"separately":[29],"then":[31],"measure":[32],"their":[33,63],"similarities":[34],"specific":[37],"or":[38],"space.":[41],"Recently,":[42],"along":[43],"with":[44],"booming":[46],"of":[47,55,158],"deep":[48],"convolutional":[49],"neural":[50],"networks":[51],"(DCNNs),":[52],"these":[53],"kinds":[54],"methods":[56],"are":[57,77],"vivid":[58],"achieve":[60],"successes":[61],"own":[64],"applications.":[65],"However,":[66],"they":[67,76],"neglect":[68],"inherent":[70],"relationships":[71],"between":[72,136],"different":[73,137],"features,":[74,161],"always":[78],"heavy.":[79,121],"To":[80],"overcome":[81],"limitations":[83],"mentioned":[84],"above,":[85],"we":[86],"propose":[87],"new":[89],"model":[90,118],"this":[94],"paper,":[95],"named":[96],"multi-scale":[97,142],"interactive":[98],"transformer":[99,125],"(MSIT).":[100],"MSIT":[101,123,162],"first":[102],"adopts":[103],"simple":[104],"learning":[106,144],"models":[107],"images":[112],"which":[113,171],"could":[114],"ensure":[115],"whole":[117],"not":[120],"Then,":[122],"introduces":[124],"encoders":[126],"enhance":[128],"features'":[129],"usefulness":[130],"by":[131],"considering":[132],"potential":[134],"relations":[135],"representations.":[138],"Also,":[139],"lightweight":[141],"module":[145],"proposed":[147],"mine":[149],"more":[150],"plentiful":[151],"contents":[152],"from":[153],"images.":[155],"Finally,":[156],"instead":[157],"outputting":[159],"produces":[163],"matching":[164],"scores":[165],"images,":[170],"can":[172],"be":[173],"used":[174],"decide":[176],"results":[179,183],"directly.":[180],"The":[181],"experimental":[182],"on":[184],"two":[185],"datasets":[187],"indicate":[188],"our":[189],"modal":[190],"effective":[192],"CMRSITR.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
