{"id":"https://openalex.org/W4411408475","doi":"https://doi.org/10.1109/jstars.2025.3580686","title":"Semantic\u2013Spatial Feature Fusion With Dynamic Graph Refinement for Remote Sensing Image Captioning","display_name":"Semantic\u2013Spatial Feature Fusion With Dynamic Graph Refinement for Remote Sensing Image Captioning","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411408475","doi":"https://doi.org/10.1109/jstars.2025.3580686"},"language":"en","primary_location":{"id":"doi:10.1109/jstars.2025.3580686","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstars.2025.3580686","pdf_url":null,"source":{"id":"https://openalex.org/S117727964","display_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","issn_l":"1939-1404","issn":["1939-1404","2151-1535"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/jstars.2025.3580686","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021380974","display_name":"Maofu Liu","orcid":"https://orcid.org/0000-0002-3732-4354"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Maofu Liu","raw_affiliation_strings":["School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiahui Liu","orcid":"https://orcid.org/0009-0008-9693-0734"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiahui Liu","raw_affiliation_strings":["School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5115593470","display_name":"Xiaokang Zhang","orcid":"https://orcid.org/0000-0002-6127-4801"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaokang Zhang","raw_affiliation_strings":["School of Information Science and Engineering, Wuhan University of Science and Technology, Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Wuhan University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I43922553"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5021380974"],"corresponding_institution_ids":["https://openalex.org/I43922553"],"apc_list":{"value":1250,"currency":"USD","value_usd":1250},"apc_paid":{"value":1250,"currency":"USD","value_usd":1250},"fwci":3.6542,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.93200353,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"18","issue":null,"first_page":"15442","last_page":"15455"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.876213550567627},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8065961003303528},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5717338919639587},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.5479183793067932},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5464951992034912},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5427887439727783},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.46300485730171204},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.44229868054389954},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.42355817556381226},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.417267769575119},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4115244448184967},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3726978302001953},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33072003722190857},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.1718102991580963}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.876213550567627},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8065961003303528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5717338919639587},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.5479183793067932},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5464951992034912},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5427887439727783},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.46300485730171204},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.44229868054389954},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.42355817556381226},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.417267769575119},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4115244448184967},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3726978302001953},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33072003722190857},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.1718102991580963},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jstars.2025.3580686","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstars.2025.3580686","pdf_url":null,"source":{"id":"https://openalex.org/S117727964","display_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","issn_l":"1939-1404","issn":["1939-1404","2151-1535"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:e0754bcfb3d64c7ba19db2ccf1ce9424","is_oa":true,"landing_page_url":"https://doaj.org/article/e0754bcfb3d64c7ba19db2ccf1ce9424","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing, Vol 18, Pp 15442-15455 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/jstars.2025.3580686","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstars.2025.3580686","pdf_url":null,"source":{"id":"https://openalex.org/S117727964","display_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","issn_l":"1939-1404","issn":["1939-1404","2151-1535"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4669320296","display_name":null,"funder_award_id":"42371374","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1895577753","https://openalex.org/W1956340063","https://openalex.org/W2101105183","https://openalex.org/W2506483933","https://openalex.org/W2510520237","https://openalex.org/W2603566245","https://openalex.org/W2745461083","https://openalex.org/W2779054585","https://openalex.org/W2904551248","https://openalex.org/W2911584214","https://openalex.org/W2920981979","https://openalex.org/W2963084599","https://openalex.org/W2979924880","https://openalex.org/W2997056851","https://openalex.org/W3004561134","https://openalex.org/W3011916860","https://openalex.org/W3015625772","https://openalex.org/W3034655362","https://openalex.org/W3046675509","https://openalex.org/W3048631361","https://openalex.org/W3117344638","https://openalex.org/W3154766321","https://openalex.org/W3194015448","https://openalex.org/W3216130706","https://openalex.org/W4206111836","https://openalex.org/W4211112734","https://openalex.org/W4214587440","https://openalex.org/W4226285265","https://openalex.org/W4317433994","https://openalex.org/W4318681845","https://openalex.org/W4380763457","https://openalex.org/W4385245566","https://openalex.org/W4386003541","https://openalex.org/W4387986561","https://openalex.org/W4390539794","https://openalex.org/W4390788051","https://openalex.org/W4390873076","https://openalex.org/W4391226826","https://openalex.org/W4391305855","https://openalex.org/W4391341588","https://openalex.org/W4392543906","https://openalex.org/W4394585954","https://openalex.org/W4394804940","https://openalex.org/W4396941249","https://openalex.org/W4399399400","https://openalex.org/W4400977318","https://openalex.org/W4403183405","https://openalex.org/W4403210463","https://openalex.org/W4404563351","https://openalex.org/W4405023205","https://openalex.org/W4405625226","https://openalex.org/W4407152340","https://openalex.org/W4408145414","https://openalex.org/W4409383105","https://openalex.org/W6678262379","https://openalex.org/W6682631176","https://openalex.org/W6763643401","https://openalex.org/W6861046571"],"related_works":["https://openalex.org/W2132659060","https://openalex.org/W2031992971","https://openalex.org/W2788731446","https://openalex.org/W2204403038","https://openalex.org/W3214791684","https://openalex.org/W3152170969","https://openalex.org/W2379054866","https://openalex.org/W2370195708","https://openalex.org/W1490651872","https://openalex.org/W2139242969"],"abstract_inverted_index":{"Remote":[0],"sensing":[1,20],"image":[2,62],"captioning":[3],"aims":[4],"to":[5,14,60,114,146],"generate":[6],"semantically":[7],"accurate":[8],"descriptions":[9],"that":[10,56,142],"are":[11,57,143],"closely":[12],"linked":[13],"the":[15,39,61,83,122,130,147,156,162,165,175,178],"visual":[16,29,47],"features":[17,30,113],"of":[18,28,42,164,177],"remote":[19],"images.":[21],"Existing":[22],"approaches":[23],"typically":[24],"emphasize":[25],"fine-grained":[26],"extraction":[27],"and":[31,49,88,111,118,150],"capturing":[32],"global":[33],"information.":[34,120],"However,":[35],"they":[36],"often":[37],"overlook":[38],"complementary":[40],"role":[41],"textual":[43],"information":[44],"in":[45,52],"enhancing":[46],"semantics":[48],"face":[50],"challenges":[51],"precisely":[53],"locating":[54],"objects":[55,141],"most":[58,144],"relevant":[59,145],"context.":[63],"To":[64],"address":[65],"these":[66],"challenges,":[67],"this":[68],"paper":[69],"presents":[70],"a":[71,99,125,136],"semantic-spatial":[72,84],"feature":[73,85,91,101,133],"fusion":[74,86],"with":[75],"dynamic":[76,89,137],"graph":[77,90,126],"refinement":[78,92],"(SFDR)":[79],"method,":[80],"which":[81],"integrates":[82],"(SSFF)":[87],"(DGFR)":[93],"modules.":[94],"The":[95,181],"SSFF":[96],"module":[97],"utilizes":[98],"multi-level":[100],"representation":[102],"strategy":[103],"by":[104],"leveraging":[105],"pre-trained":[106],"CLIP":[107],"features,":[108,110],"grid":[109],"ROI":[112],"integrate":[115],"rich":[116],"semantic":[117],"spatial":[119],"In":[121],"DGFR":[123],"module,":[124],"attention":[127],"network":[128],"captures":[129],"relationships":[131],"between":[132],"nodes,":[134],"while":[135],"weighting":[138],"mechanism":[139],"prioritizes":[140],"current":[148],"scene":[149],"suppresses":[151],"less":[152],"significant":[153],"ones.":[154],"Therefore,":[155],"proposed":[157,179],"SFDR":[158],"method":[159],"significantly":[160],"enhances":[161],"quality":[163],"generated":[166],"descriptions.":[167],"Experimental":[168],"results":[169],"on":[170],"three":[171],"benchmark":[172],"datasets":[173],"demonstrate":[174],"effectiveness":[176],"method.":[180],"source":[182],"code":[183],"will":[184],"be":[185],"available":[186],"at":[187],"<uri":[188],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[189],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/zxk688/SFDR</uri>.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-06-19T00:00:00"}
