{"id":"https://openalex.org/W4404740427","doi":"https://doi.org/10.1109/icbase63199.2024.10762433","title":"Multi-modal Remote Sensing Visual Question Answering Algorithm Based on Large Language Model","display_name":"Multi-modal Remote Sensing Visual Question Answering Algorithm Based on Large Language Model","publication_year":2024,"publication_date":"2024-09-20","ids":{"openalex":"https://openalex.org/W4404740427","doi":"https://doi.org/10.1109/icbase63199.2024.10762433"},"language":"en","primary_location":{"id":"doi:10.1109/icbase63199.2024.10762433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icbase63199.2024.10762433","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 5th International Conference on Big Data &amp;amp; Artificial Intelligence &amp;amp; Software Engineering (ICBASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107836271","display_name":"S.-L. Qiu","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shengbang Qiu","raw_affiliation_strings":["Beijing Institute of Technology,School of Computer Science and Technology,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology,School of Computer Science and Technology,Beijing,China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5107836271"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":5.7713,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96498982,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"20","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.819100022315979,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10757","display_name":"Geographic Information Systems Studies","score":0.819100022315979,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13903","display_name":"Innovative Educational Techniques","score":0.7936999797821045,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12343","display_name":"Geography Education and Pedagogy","score":0.6917999982833862,"subfield":{"id":"https://openalex.org/subfields/3305","display_name":"Geography, Planning and Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7652814388275146},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6899951100349426},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.6250597834587097},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4463990330696106},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4438304007053375},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.38370534777641296},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3581458628177643}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7652814388275146},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6899951100349426},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.6250597834587097},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4463990330696106},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4438304007053375},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38370534777641296},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3581458628177643},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icbase63199.2024.10762433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icbase63199.2024.10762433","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 5th International Conference on Big Data &amp;amp; Artificial Intelligence &amp;amp; Software Engineering (ICBASE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.550000011920929}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1895577753","https://openalex.org/W2064675550","https://openalex.org/W2510520237","https://openalex.org/W2592962403","https://openalex.org/W2745461083","https://openalex.org/W2779054585","https://openalex.org/W2920981979","https://openalex.org/W3017628311","https://openalex.org/W3194015448","https://openalex.org/W4385245566","https://openalex.org/W6791353385","https://openalex.org/W6810334672","https://openalex.org/W6849177959","https://openalex.org/W6851592950","https://openalex.org/W6851950068"],"related_works":["https://openalex.org/W2384605597","https://openalex.org/W2387743295","https://openalex.org/W2051487156","https://openalex.org/W3082787378","https://openalex.org/W2136007095","https://openalex.org/W2366230879","https://openalex.org/W4288267738","https://openalex.org/W2964413124","https://openalex.org/W4388937922","https://openalex.org/W3113264705"],"abstract_inverted_index":{"The":[0],"field":[1],"of":[2,16,33,48,52,64,94,110,144],"remote":[3,23,111,152,172],"sensing":[4,24,112,153,173],"image":[5,65,121],"applications":[6],"is":[7,128],"experiencing":[8],"unprecedented":[9],"attention,":[10],"particularly":[11],"with":[12],"the":[13,29,44,53,91,108,117,131,138,161],"emerging":[14],"rise":[15],"visual":[17],"question":[18],"answering":[19],"(VQA)":[20],"tasks":[21],"for":[22,137],"images.":[25,113],"However,":[26],"constrained":[27],"by":[28],"scale":[30,143],"and":[31,46,60,66,98,122,142],"diversity":[32,141],"existing":[34,145],"datasets,":[35,146],"traditional":[36],"approaches":[37],"often":[38],"rely":[39],"on":[40,83,169],"small-scale":[41],"models,":[42,103],"limiting":[43],"depth":[45],"breadth":[47],"understanding.":[49],"In":[50],"light":[51],"remarkable":[54],"advancements":[55],"in":[56,140,167],"large":[57,102],"language":[58],"models":[59],"their":[61,105],"vast":[62],"repository":[63],"semantic":[67,99],"knowledge,":[68],"we":[69,147],"innovatively":[70],"proposes":[71],"an":[72],"Adversarial":[73],"MultiModal":[74],"Remote":[75],"Sensing":[76],"Image":[77],"Visual":[78],"Question":[79],"Answering":[80],"algorithm":[81,162],"based":[82],"Large":[84],"Language":[85],"Model(MMRS).":[86],"It":[87],"aims":[88],"to":[89,107,135],"leverage":[90],"profound":[92],"understanding":[93],"natural":[95],"world":[96],"images":[97],"information":[100],"from":[101],"transferring":[104],"advantages":[106,166],"domain":[109],"To":[114],"further":[115],"enhance":[116],"alignment":[118],"accuracy":[119],"between":[120],"text":[123],"modalities,":[124],"a":[125,149],"discriminator":[126],"module":[127],"incorporated":[129],"into":[130],"MMRS":[132],"algorithm.":[133],"Moreover,":[134],"compensate":[136],"deficiencies":[139],"constructs":[148],"more":[150],"diverse":[151],"image-text":[154],"dataset":[155],"NWPU-GPT.":[156],"Experimental":[157],"results":[158],"demonstrate":[159],"that":[160],"exhibits":[163],"significant":[164],"performance":[165],"tests":[168],"multiple":[170],"classic":[171],"datasets.":[174]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
