{"id":"https://openalex.org/W4399169045","doi":"https://doi.org/10.1109/tgrs.2024.3407598","title":"Language Query-Based Transformer With Multiscale Cross-Modal Alignment for Visual Grounding on Remote Sensing Images","display_name":"Language Query-Based Transformer With Multiscale Cross-Modal Alignment for Visual Grounding on Remote Sensing Images","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4399169045","doi":"https://doi.org/10.1109/tgrs.2024.3407598"},"language":"en","primary_location":{"id":"doi:10.1109/tgrs.2024.3407598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2024.3407598","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101833357","display_name":"Meng Lan","orcid":"https://orcid.org/0000-0002-5555-5076"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210125402","display_name":"Hubei Zhongshan Hospital","ror":"https://ror.org/02xhgjz70","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210125402"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Meng Lan","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","Hubei Luojia Laboratory, Wuhan, P. R. China","School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"Hubei Luojia Laboratory, Wuhan, P. R. China","institution_ids":["https://openalex.org/I4210125402","https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084193949","display_name":"Fu Rong","orcid":"https://orcid.org/0009-0007-2980-9697"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210125402","display_name":"Hubei Zhongshan Hospital","ror":"https://ror.org/02xhgjz70","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210125402"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fu Rong","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China","Hubei Luojia Laboratory, Wuhan, P. R. China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"Hubei Luojia Laboratory, Wuhan, P. R. China","institution_ids":["https://openalex.org/I4210125402","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026145013","display_name":"Hongzan Jiao","orcid":"https://orcid.org/0000-0002-7048-3293"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongzan Jiao","raw_affiliation_strings":["School of Urban Design, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Urban Design, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084683976","display_name":"Zhi Gao","orcid":"https://orcid.org/0000-0003-3325-1183"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhi Gao","raw_affiliation_strings":["School of Remote Sensing and Information Engineering, Wuhan University, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Remote Sensing and Information Engineering, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024278302","display_name":"Lefei Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210125402","display_name":"Hubei Zhongshan Hospital","ror":"https://ror.org/02xhgjz70","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210125402"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lefei Zhang","raw_affiliation_strings":["Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","Hubei Luojia Laboratory, Wuhan, P. R. China","School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, School of Computer Science, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"Hubei Luojia Laboratory, Wuhan, P. R. China","institution_ids":["https://openalex.org/I4210125402","https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Computer Science, Institute of Artificial Intelligence, Wuhan University, Wuhan, P. R. China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101833357"],"corresponding_institution_ids":["https://openalex.org/I37461747","https://openalex.org/I4210125402"],"apc_list":null,"apc_paid":null,"fwci":55.0639,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.99855419,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"62","issue":null,"first_page":"1","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9526000022888184,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9301000237464905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7051544785499573},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6357623338699341},{"id":"https://openalex.org/keywords/ground","display_name":"Ground","score":0.6157678961753845},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6088228225708008},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.51596599817276},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.45091938972473145},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.38899877667427063},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.385514497756958},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.18846291303634644},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.18534091114997864},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.17122295498847961},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12161111831665039},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.0865328311920166}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7051544785499573},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6357623338699341},{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.6157678961753845},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6088228225708008},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.51596599817276},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.45091938972473145},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38899877667427063},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.385514497756958},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.18846291303634644},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.18534091114997864},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.17122295498847961},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12161111831665039},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0865328311920166},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgrs.2024.3407598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2024.3407598","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2131151903","display_name":null,"funder_award_id":"42192580","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4308293926","display_name":null,"funder_award_id":"42192583","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7684016204","display_name":null,"funder_award_id":"62122060","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2779054585","https://openalex.org/W2896457183","https://openalex.org/W2962764817","https://openalex.org/W2962766617","https://openalex.org/W2963351448","https://openalex.org/W2963735856","https://openalex.org/W2964345792","https://openalex.org/W2973030851","https://openalex.org/W2983358816","https://openalex.org/W2986803748","https://openalex.org/W2987734933","https://openalex.org/W2992240579","https://openalex.org/W3006154882","https://openalex.org/W3034772468","https://openalex.org/W3035268124","https://openalex.org/W3096609285","https://openalex.org/W3100245404","https://openalex.org/W3110435696","https://openalex.org/W3122239467","https://openalex.org/W3163747765","https://openalex.org/W3174004334","https://openalex.org/W3195858154","https://openalex.org/W3203608457","https://openalex.org/W4200631575","https://openalex.org/W4210820868","https://openalex.org/W4214490042","https://openalex.org/W4225630686","https://openalex.org/W4283029876","https://openalex.org/W4304084012","https://openalex.org/W4312351586","https://openalex.org/W4313021481","https://openalex.org/W4313136325","https://openalex.org/W4313145013","https://openalex.org/W4321021750","https://openalex.org/W4322707256","https://openalex.org/W4382461844","https://openalex.org/W4384009247","https://openalex.org/W4384820618","https://openalex.org/W4385245566","https://openalex.org/W4387350510","https://openalex.org/W4387717533","https://openalex.org/W4391305855","https://openalex.org/W4391953355","https://openalex.org/W6784094891"],"related_works":["https://openalex.org/W2021787609","https://openalex.org/W2097328689","https://openalex.org/W4234899305","https://openalex.org/W1537063595","https://openalex.org/W2379604501","https://openalex.org/W2373854414","https://openalex.org/W2522183581","https://openalex.org/W2954371137","https://openalex.org/W2139939267","https://openalex.org/W1974511032"],"abstract_inverted_index":{"Visual":[0],"grounding":[1],"for":[2,47,87,133],"remote":[3,15,195],"sensing":[4,16,196],"images":[5,18,197],"(RSVG)":[6],"aims":[7],"to":[8,20,27,42,57,105,152,169,184],"localize":[9],"the":[10,14,60,67,72,94,100,112,116,121,149,154,158,165,186,189,214],"referred":[11,64,113,138],"objects":[12],"in":[13,75,120],"(RS)":[17],"according":[19],"a":[21,39,44,80,141,176],"language":[22,82,103,125],"expression.":[23],"Existing":[24],"methods":[25,216],"tend":[26],"align":[28],"visual":[29,118,159],"and":[30,36,107,160,217,223],"text":[31,97,161],"features":[32,98,119],"followed":[33],"by":[34,71],"concatenation":[35],"then":[37,128],"employ":[38],"fusion":[40,53],"Transformer":[41,54,85,122,151],"learn":[43,59],"token":[45],"representation":[46,62,109],"final":[48,134],"target":[49],"localization.":[50],"However,":[51],"simple":[52],"structure":[55],"fails":[56],"sufficiently":[58],"location":[61],"of":[63,111,137,188],"object":[65,114,131,173],"from":[66,115],"multi-modal":[68],"features.":[69],"Inspired":[70],"detection":[73],"Transformer,":[74],"this":[76],"paper,":[77],"we":[78,92],"propose":[79],"novel":[81],"query":[83],"based":[84],"framework":[86],"RSVG":[88,178,190],"termed":[89],"LQVG.":[90],"Specifically,":[91],"adopt":[93],"extracted":[95],"sentence-level":[96],"as":[99],"queries,":[101,104],"called":[102],"retrieve":[106],"aggregate":[108],"information":[110],"multi-scale":[117,142],"decoder.":[123],"The":[124,221],"queries":[126],"are":[127,225],"converted":[129],"into":[130],"embeddings":[132],"coordinate":[135],"prediction":[136],"object.":[139],"Besides,":[140],"cross-modal":[143,166],"alignment":[144],"module":[145],"is":[146,182],"devised":[147],"before":[148],"multimodal":[150],"enhance":[153],"semantic":[155],"correlation":[156],"between":[157],"features,":[162],"thus":[163],"facilitating":[164],"decoding":[167],"process":[168],"generate":[170],"more":[171],"precise":[172],"representation.":[174],"Moreover,":[175],"new":[177],"dataset":[179,222],"named":[180],"RSVG-HR":[181],"built":[183],"evaluate":[185],"performance":[187],"approaches":[191],"on":[192,203],"very":[193],"high-resolution":[194],"with":[198],"inconspicuous":[199],"objects.":[200],"Experimental":[201],"results":[202],"two":[204],"benchmark":[205],"datasets":[206],"demonstrate":[207],"that":[208],"our":[209],"proposed":[210],"method":[211],"significantly":[212],"surpasses":[213],"comparison":[215],"achieves":[218],"state-of-the-art":[219],"performance.":[220],"code":[224],"available":[226],"at":[227],"https://github.com/LANMNG/LQVG.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":25},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
