{"id":"https://openalex.org/W4411485191","doi":"https://doi.org/10.1109/lgrs.2025.3581558","title":"Task Knowledge Injection: Training-Free Adaptation of Multimodal Large Language Models for Remote Sensing Image Understanding","display_name":"Task Knowledge Injection: Training-Free Adaptation of Multimodal Large Language Models for Remote Sensing Image Understanding","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411485191","doi":"https://doi.org/10.1109/lgrs.2025.3581558"},"language":"en","primary_location":{"id":"doi:10.1109/lgrs.2025.3581558","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2025.3581558","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100398353","display_name":"Haifeng Li","orcid":"https://orcid.org/0000-0003-1173-6593"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haifeng Li","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028261944","display_name":"Qiujun Li","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiujun Li","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060417049","display_name":"Cheng Yang","orcid":"https://orcid.org/0000-0001-7821-0030"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Yang","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114928929","display_name":"Wang Guo","orcid":"https://orcid.org/0009-0005-2478-2558"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wang Guo","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100393519","display_name":"Mengyao Li","orcid":"https://orcid.org/0000-0002-3284-3462"},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyao Li","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114214614","display_name":"Hongyuan Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyuan Yuan","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111334880","display_name":"Run Shao","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Run Shao","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005693926","display_name":"Chengli Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I139660479","display_name":"Central South University","ror":"https://ror.org/00f1zfq44","country_code":"CN","type":"education","lineage":["https://openalex.org/I139660479"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengli Peng","raw_affiliation_strings":["School of Geosciences and Info-Physics, Central South University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"School of Geosciences and Info-Physics, Central South University, Changsha, China","institution_ids":["https://openalex.org/I139660479"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100398353"],"corresponding_institution_ids":["https://openalex.org/I139660479"],"apc_list":null,"apc_paid":null,"fwci":1.3104,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.81896059,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"22","issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9835000038146973,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7894034385681152},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.6495269536972046},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6473996639251709},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5947703123092651},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.5046931505203247},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.44222599267959595},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4147937595844269},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3672621250152588},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.3453493118286133},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3358875811100006},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08496245741844177},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07960647344589233}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7894034385681152},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6495269536972046},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6473996639251709},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5947703123092651},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.5046931505203247},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.44222599267959595},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4147937595844269},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3672621250152588},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.3453493118286133},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3358875811100006},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08496245741844177},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07960647344589233},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lgrs.2025.3581558","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lgrs.2025.3581558","pdf_url":null,"source":{"id":"https://openalex.org/S126920919","display_name":"IEEE Geoscience and Remote Sensing Letters","issn_l":"1545-598X","issn":["1545-598X","1558-0571"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Geoscience and Remote Sensing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2510520237","https://openalex.org/W2779054585","https://openalex.org/W3012111773","https://openalex.org/W3098351727","https://openalex.org/W3100245404","https://openalex.org/W3199693760","https://openalex.org/W4225630686","https://openalex.org/W4292968451","https://openalex.org/W4386065596","https://openalex.org/W4386065803","https://openalex.org/W4387723654","https://openalex.org/W4391305855","https://openalex.org/W4399837196","https://openalex.org/W4402776460","https://openalex.org/W4406138127","https://openalex.org/W6777615688","https://openalex.org/W6857872576","https://openalex.org/W6861778986","https://openalex.org/W6869661489","https://openalex.org/W6873875220"],"related_works":["https://openalex.org/W1564680838","https://openalex.org/W2003125260","https://openalex.org/W2060591604","https://openalex.org/W1992291644","https://openalex.org/W2166791242","https://openalex.org/W2585162246","https://openalex.org/W1934413089","https://openalex.org/W2098419343","https://openalex.org/W2051178964","https://openalex.org/W2989714914"],"abstract_inverted_index":{"Parameter":[0],"fine-tuning":[1],"is":[2,119,142],"the":[3,70,111,129,145,164,169,188],"mainstream":[4],"approach":[5,172],"for":[6,107],"adapting":[7],"Multimodal":[8],"Large":[9],"Langauge":[10],"Models":[11],"(MLLMs)":[12],"to":[13,77,121,192],"downstream":[14,34],"remote":[15],"sensing":[16],"tasks.":[17],"However,":[18],"such":[19],"method":[20,161],"risks":[21],"degrading":[22],"pre-trained":[23],"knowledge":[24,60,67,76,95,127,141],"and":[25,104,134,179],"also":[26],"incur":[27],"significant":[28],"costs.":[29],"This":[30],"paper":[31],"argues":[32],"that":[33,159],"adaptation":[35],"of":[36,42,168],"MLLMs":[37],"essentially":[38],"involves":[39],"effective":[40],"injection":[41,61],"task-specific":[43],"knowledge,":[44],"which":[45],"does":[46],"not":[47],"necessarily":[48],"require":[49],"parameter":[50],"updates.":[51],"Based":[52],"on":[53,187],"this":[54],"perspective,":[55],"we":[56,88],"propose":[57],"a":[58,65,90,102],"training-free":[59],"method.":[62],"By":[63],"constructing":[64],"multi-task":[66],"base":[68],"(MTKB),":[69],"model":[71],"can":[72],"dynamically":[73],"retrieve":[74],"task-related":[75],"serve":[78],"as":[79],"context":[80],"during":[81],"inference,":[82],"thereby":[83],"enhancing":[84],"its":[85],"understanding.":[86],"Specifically,":[87],"design":[89],"three-part":[91],"framework.":[92],"(1)":[93],"Task":[94],"construction:":[96],"Diverse":[97],"texts":[98],"are":[99],"unified":[100],"into":[101,144],"key":[103],"value":[105],"structure":[106],"image-text":[108],"matching,":[109],"forming":[110],"MTKB.":[112],"(2)":[113],"Two-stage":[114],"retrieval:":[115],"A":[116],"coarse-to-fine":[117],"process":[118],"employed":[120],"match":[122],"query":[123],"images":[124],"with":[125,185],"task":[126],"in":[128,177],"MTKB,":[130],"utilizing":[131],"both":[132],"unimodal":[133],"cross-modal":[135],"similarity.":[136],"(3)":[137],"Knowledge":[138],"injection:":[139],"Matched":[140],"integrated":[143],"MLLM":[146],"via":[147],"extended":[148],"embeddings,":[149],"without":[150],"altering":[151],"parameters.":[152],"Experimental":[153],"results":[154],"across":[155,182],"multiple":[156],"datasets":[157],"demonstrate":[158],"our":[160],"significantly":[162],"enhances":[163],"image":[165],"understanding":[166],"capabilities":[167],"model.":[170],"Our":[171],"achieves":[173],"about":[174],"5%":[175],"improvement":[176],"accuracy":[178],"related":[180],"metrics":[181],"several":[183],"datasets,":[184],"performance":[186],"RSVQ-LR":[189],"dataset":[190],"comparable":[191],"specialized":[193],"models.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
