{"id":"https://openalex.org/W4402265914","doi":"https://doi.org/10.1109/igarss53475.2024.10642082","title":"Segmentation-Guided Attention for Visual Question Answering from Remote Sensing Images","display_name":"Segmentation-Guided Attention for Visual Question Answering from Remote Sensing Images","publication_year":2024,"publication_date":"2024-07-07","ids":{"openalex":"https://openalex.org/W4402265914","doi":"https://doi.org/10.1109/igarss53475.2024.10642082"},"language":"en","primary_location":{"id":"doi:10.1109/igarss53475.2024.10642082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igarss53475.2024.10642082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IGARSS 2024 - 2024 IEEE International Geoscience and Remote Sensing Symposium","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093093945","display_name":"Lucrezia Tosato","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091437","display_name":"Sorbonne Paris Cit\u00e9","ror":"https://ror.org/001z21q04","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210091437"]},{"id":"https://openalex.org/I4403386760","display_name":"Laboratoire Informatique Paris Descartes","ror":"https://ror.org/04s80ef73","country_code":"FR","type":"facility","lineage":["https://openalex.org/I204730241","https://openalex.org/I4403386760"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Lucrezia Tosato","raw_affiliation_strings":["Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006","institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104453423","display_name":"Hichem Boussaid","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091437","display_name":"Sorbonne Paris Cit\u00e9","ror":"https://ror.org/001z21q04","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210091437"]},{"id":"https://openalex.org/I4403386760","display_name":"Laboratoire Informatique Paris Descartes","ror":"https://ror.org/04s80ef73","country_code":"FR","type":"facility","lineage":["https://openalex.org/I204730241","https://openalex.org/I4403386760"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Hichem Boussaid","raw_affiliation_strings":["Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006","institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034942073","display_name":"Flora Weissgerber","orcid":"https://orcid.org/0000-0003-2662-552X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Flora Weissgerber","raw_affiliation_strings":["Universit&#x00E9; Paris Saclay,DTIS, ONERA,Palaiseau,France,FR-91123"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Saclay,DTIS, ONERA,Palaiseau,France,FR-91123","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090167453","display_name":"Camille Kurtz","orcid":"https://orcid.org/0000-0001-9254-7537"},"institutions":[{"id":"https://openalex.org/I4210091437","display_name":"Sorbonne Paris Cit\u00e9","ror":"https://ror.org/001z21q04","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210091437"]},{"id":"https://openalex.org/I4403386760","display_name":"Laboratoire Informatique Paris Descartes","ror":"https://ror.org/04s80ef73","country_code":"FR","type":"facility","lineage":["https://openalex.org/I204730241","https://openalex.org/I4403386760"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Camille Kurtz","raw_affiliation_strings":["Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006","institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080615669","display_name":"Laurent Wendling","orcid":"https://orcid.org/0000-0003-1091-5995"},"institutions":[{"id":"https://openalex.org/I4210091437","display_name":"Sorbonne Paris Cit\u00e9","ror":"https://ror.org/001z21q04","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210091437"]},{"id":"https://openalex.org/I4403386760","display_name":"Laboratoire Informatique Paris Descartes","ror":"https://ror.org/04s80ef73","country_code":"FR","type":"facility","lineage":["https://openalex.org/I204730241","https://openalex.org/I4403386760"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Laurent Wendling","raw_affiliation_strings":["Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006","institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087677326","display_name":"Sylvain Lobry","orcid":"https://orcid.org/0000-0003-4738-2416"},"institutions":[{"id":"https://openalex.org/I4210091437","display_name":"Sorbonne Paris Cit\u00e9","ror":"https://ror.org/001z21q04","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210091437"]},{"id":"https://openalex.org/I4403386760","display_name":"Laboratoire Informatique Paris Descartes","ror":"https://ror.org/04s80ef73","country_code":"FR","type":"facility","lineage":["https://openalex.org/I204730241","https://openalex.org/I4403386760"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sylvain Lobry","raw_affiliation_strings":["Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris Cite,LIPADE,Paris,France,75006","institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5093093945"],"corresponding_institution_ids":["https://openalex.org/I4210091437","https://openalex.org/I4403386760"],"apc_list":null,"apc_paid":null,"fwci":1.6935,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.85552138,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2750","last_page":"2754"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7246337532997131},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6472333669662476},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5886998176574707},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5532292723655701},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5456734895706177},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.544135332107544},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3249611258506775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7246337532997131},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6472333669662476},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5886998176574707},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5532292723655701},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5456734895706177},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.544135332107544},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3249611258506775}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/igarss53475.2024.10642082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/igarss53475.2024.10642082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IGARSS 2024 - 2024 IEEE International Geoscience and Remote Sensing Symposium","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-04809734v1","is_oa":false,"landing_page_url":"https://hal.science/hal-04809734","pdf_url":null,"source":{"id":"https://openalex.org/S4406922461","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IGARSS 2024 - 2024 IEEE International Geoscience and Remote Sensing Symposium, Jul 2024, Ath\u00e8nes, Greece. pp.2750-2754, &#x27E8;10.1109/IGARSS53475.2024.10642082&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W1933349210","https://openalex.org/W2194775991","https://openalex.org/W2507296351","https://openalex.org/W2944418962","https://openalex.org/W2963705779","https://openalex.org/W2973009097","https://openalex.org/W2978017171","https://openalex.org/W2983550634","https://openalex.org/W3012111773","https://openalex.org/W3035552787","https://openalex.org/W3035588244","https://openalex.org/W3098351727","https://openalex.org/W3138516171","https://openalex.org/W3168972675","https://openalex.org/W4292828962","https://openalex.org/W4307321662","https://openalex.org/W4312719951","https://openalex.org/W4389156953","https://openalex.org/W4390873086","https://openalex.org/W6768851824","https://openalex.org/W6858452920"],"related_works":["https://openalex.org/W2384605597","https://openalex.org/W2387743295","https://openalex.org/W3082787378","https://openalex.org/W2136007095","https://openalex.org/W2366230879","https://openalex.org/W3208425359","https://openalex.org/W2349927912","https://openalex.org/W3159777597","https://openalex.org/W4212839359","https://openalex.org/W1522196789"],"abstract_inverted_index":{"Visual":[0],"Question":[1],"Answering":[2],"for":[3,64],"Remote":[4],"Sensing":[5],"(RSVQA)":[6],"is":[7,29],"a":[8,21,35,65,82,90,98,118,153],"task":[9],"that":[10,87,122],"aims":[11],"at":[12],"answering":[13],"natural":[14],"language":[15],"questions":[16],"about":[17],"the":[18,47,56,59,102,157],"content":[19],"of":[20,55,101,110,141,148],"remote":[22],"sensing":[23],"image.":[24],"The":[25],"visual":[26,62,103],"features":[27],"extraction":[28],"therefore":[30],"an":[31,75],"essential":[32],"step":[33],"in":[34,93],"VQA":[36,120],"pipeline.":[37,84],"By":[38],"incorporating":[39],"attention":[40,76,95],"mechanisms":[41],"into":[42,81],"this":[43,69,114],"process,":[44],"models":[45],"gain":[46],"ability":[48],"to":[49,73,152],"focus":[50],"selectively":[51],"on":[52,156],"salient":[53],"regions":[54],"image,":[57],"prioritizing":[58],"most":[60],"relevant":[61],"information":[63],"given":[66],"question.":[67],"In":[68],"work,":[70],"we":[71,116],"propose":[72],"embed":[74],"mechanism":[77],"guided":[78],"by":[79,96],"segmentation":[80,88,131],"RSVQA":[83],"We":[85],"argue":[86],"plays":[89],"crucial":[91],"role":[92],"guiding":[94],"providing":[97],"contextual":[99],"understanding":[100],"information,":[104],"underlying":[105],"specific":[106],"objects":[107],"or":[108],"areas":[109],"interest.":[111],"To":[112],"evaluate":[113],"methodology,":[115,144],"provide":[117],"new":[119,143],"dataset":[121],"exploits":[123],"very":[124],"high-resolution":[125],"RGB":[126],"orthophotos":[127],"annotated":[128],"with":[129],"16":[130],"classes":[132],"and":[133],"question/answer":[134],"pairs.":[135],"Our":[136],"study":[137],"shows":[138],"promising":[139],"results":[140],"our":[142],"gaining":[145],"almost":[146],"10%":[147],"overall":[149],"accuracy":[150],"compared":[151],"classical":[154],"method":[155],"proposed":[158],"dataset.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
