{"id":"https://openalex.org/W4386472879","doi":"https://doi.org/10.1109/tgrs.2023.3312479","title":"Multistep Question-Driven Visual Question Answering for Remote Sensing","display_name":"Multistep Question-Driven Visual Question Answering for Remote Sensing","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386472879","doi":"https://doi.org/10.1109/tgrs.2023.3312479"},"language":"en","primary_location":{"id":"doi:10.1109/tgrs.2023.3312479","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3312479","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042379417","display_name":"Meimei Zhang","orcid":"https://orcid.org/0000-0001-9621-4879"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]},{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Meimei Zhang","raw_affiliation_strings":["International Research Center of Big Data for Sustainable Development Goals, Beijing, China","Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9621-4879","affiliations":[{"raw_affiliation_string":"International Research Center of Big Data for Sustainable Development Goals, Beijing, China","institution_ids":["https://openalex.org/I4210096250"]},{"raw_affiliation_string":"Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210137199","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fang Chen","orcid":"https://orcid.org/0000-0002-3245-2584"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]},{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fang Chen","raw_affiliation_strings":["International Research Center of Big Data for Sustainable Development Goals, Beijing, China","Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3245-2584","affiliations":[{"raw_affiliation_string":"International Research Center of Big Data for Sustainable Development Goals, Beijing, China","institution_ids":["https://openalex.org/I4210096250"]},{"raw_affiliation_string":"Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210137199","https://openalex.org/I19820366"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100365212","display_name":"Bin Li","orcid":"https://orcid.org/0000-0002-7774-5452"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]},{"id":"https://openalex.org/I4210137199","display_name":"Aerospace Information Research Institute","ror":"https://ror.org/0419fj215","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210137199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Li","raw_affiliation_strings":["International Research Center of Big Data for Sustainable Development Goals, Beijing, China","Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Research Center of Big Data for Sustainable Development Goals, Beijing, China","institution_ids":["https://openalex.org/I4210096250"]},{"raw_affiliation_string":"Aerospace Information Research Institute, Key Laboratory of Digital Earth Science, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210137199","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5042379417"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210096250","https://openalex.org/I4210137199"],"apc_list":null,"apc_paid":null,"fwci":3.0614,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.93279998,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"61","issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8529568910598755},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.8030760884284973},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6156153678894043},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.598535418510437},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5442502498626709},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.5374122262001038},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.416128009557724},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3129006028175354}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8529568910598755},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.8030760884284973},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6156153678894043},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.598535418510437},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5442502498626709},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.5374122262001038},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.416128009557724},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3129006028175354},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tgrs.2023.3312479","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tgrs.2023.3312479","pdf_url":null,"source":{"id":"https://openalex.org/S111326731","display_name":"IEEE Transactions on Geoscience and Remote Sensing","issn_l":"0196-2892","issn":["0196-2892","1558-0644"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Geoscience and Remote Sensing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1933349210","https://openalex.org/W2004808590","https://openalex.org/W2189070436","https://openalex.org/W2194775991","https://openalex.org/W2442626797","https://openalex.org/W2463565445","https://openalex.org/W2501377452","https://openalex.org/W2515866431","https://openalex.org/W2560730294","https://openalex.org/W2608030593","https://openalex.org/W2745461083","https://openalex.org/W2799150641","https://openalex.org/W2803259101","https://openalex.org/W2899012231","https://openalex.org/W2947312908","https://openalex.org/W2962749469","https://openalex.org/W2963012286","https://openalex.org/W2963163163","https://openalex.org/W2963191264","https://openalex.org/W2963383024","https://openalex.org/W2963521239","https://openalex.org/W2963717374","https://openalex.org/W2963954913","https://openalex.org/W2963991868","https://openalex.org/W2964072591","https://openalex.org/W2966683369","https://openalex.org/W2981694290","https://openalex.org/W2986685865","https://openalex.org/W2988326850","https://openalex.org/W3002557610","https://openalex.org/W3004349648","https://openalex.org/W3007556011","https://openalex.org/W3012111773","https://openalex.org/W3035517717","https://openalex.org/W3035644209","https://openalex.org/W3047246571","https://openalex.org/W3098351727","https://openalex.org/W3105577662","https://openalex.org/W3108512475","https://openalex.org/W3109072389","https://openalex.org/W3165058054","https://openalex.org/W3168972675","https://openalex.org/W3171312896","https://openalex.org/W3175205795","https://openalex.org/W3188086824","https://openalex.org/W3203031838","https://openalex.org/W4225991573","https://openalex.org/W4229439310","https://openalex.org/W4285034333","https://openalex.org/W4287214436","https://openalex.org/W4307439181","https://openalex.org/W4362470605","https://openalex.org/W4362637732","https://openalex.org/W6637373629","https://openalex.org/W6686883664","https://openalex.org/W6719057275","https://openalex.org/W6736769356","https://openalex.org/W6752083267","https://openalex.org/W6786450884","https://openalex.org/W6789155089","https://openalex.org/W6796729313","https://openalex.org/W6802006682","https://openalex.org/W6810294919"],"related_works":["https://openalex.org/W2366107444","https://openalex.org/W2384605597","https://openalex.org/W2378211422","https://openalex.org/W4388145910","https://openalex.org/W1976205134","https://openalex.org/W2381570729","https://openalex.org/W2745001401","https://openalex.org/W4248336175","https://openalex.org/W2387743295","https://openalex.org/W4321353415"],"abstract_inverted_index":{"Visual":[0],"question":[1,132,165],"answering":[2],"(VQA)":[3],"aims":[4],"to":[5,15,101,113],"build":[6,125],"an":[7,83],"interactive":[8],"system":[9,89],"that":[10,109,129,187,202],"infers":[11],"the":[12,16,53,71,76,107,114,118,131,140,164,188,212],"answer":[13],"according":[14],"input":[17],"image":[18,143],"and":[19,35,41,55,74,104,134,171,183,210,216,221],"text-based":[20],"question.":[21,115],"Recently,":[22],"VQA":[23,87,160,196],"for":[24,37,52,90],"remote":[25,63,91,158,174,194],"sensing":[26,64,159,175,195],"has":[27,204],"attracted":[28],"considerable":[29],"attention":[30,99],"since":[31],"it":[32],"is":[33,50,59,110,166],"essential":[34],"expedient":[36],"monitoring":[38],"global":[39],"resources":[40],"querying":[42],"objective":[43],"attributes.":[44],"In":[45,93],"reality,":[46],"question-related":[47],"semantic":[48,119],"information":[49,73,120],"helpful":[51],"reasoning":[54,209],"understanding":[56,211],"capabilities,":[57],"which":[58,136],"always":[60],"contained":[61],"in":[62,121,146,168,208],"images":[65,215],"or":[66],"complex":[67,122,157,169,217],"questions.":[68,218],"To":[69,116,149],"capture":[70],"valuable":[72],"extend":[75],"applications":[77],"of":[78,142],"remote-sensing":[79],"VQA,":[80],"we":[81,95,124,153],"propose":[82],"end-to-end":[84],"multiple-step":[85,98],"question-driven":[86,127],"(MQVQA)":[88],"sensing.":[92],"MQVQA,":[94],"employ":[96],"a":[97,126,155,205],"mechanism":[100],"interactively":[102],"reason":[103],"concomitantly":[105],"mark":[106],"region":[108],"most":[111],"related":[112],"understand":[117],"questions,":[123],"module":[128],"classifies":[130],"types":[133],"keywords,":[135],"will":[137],"further":[138],"guide":[139],"combination":[141],"feature":[144],"maps":[145],"different":[147],"scales.":[148],"benchmark":[150],"this":[151],"model,":[152],"construct":[154],"new":[156],"dataset":[161,222],"(CRSVQA),":[162],"wherein":[163],"asked":[167],"forms":[170],"involves":[172],"various":[173],"scenes.":[176],"The":[177,198],"evaluation":[178],"results":[179,200],"on":[180],"CRSVQA,":[181],"RSVQA":[182],"RSIVQA":[184],"datasets":[185],"indicate":[186],"proposed":[189],"MQVQA":[190,203],"model":[191],"surpasses":[192],"other":[193],"models.":[197],"visualization":[199],"demonstrate":[201],"robust":[206],"ability":[207],"content":[213],"from":[214],"Our":[219],"code":[220],"are":[223],"publicly":[224],"available":[225],"at:":[226],"https://github.com/MeimeiZhang-data/MQVQA.":[227]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
