{"id":"https://openalex.org/W4391136447","doi":"https://doi.org/10.3390/rs16030441","title":"Machine-to-Machine Visual Dialoguing with ChatGPT for Enriched Textual Image Description","display_name":"Machine-to-Machine Visual Dialoguing with ChatGPT for Enriched Textual Image Description","publication_year":2024,"publication_date":"2024-01-23","ids":{"openalex":"https://openalex.org/W4391136447","doi":"https://doi.org/10.3390/rs16030441"},"language":"en","primary_location":{"id":"doi:10.3390/rs16030441","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16030441","pdf_url":"https://www.mdpi.com/2072-4292/16/3/441/pdf?version=1706008784","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2072-4292/16/3/441/pdf?version=1706008784","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004777179","display_name":"Riccardo Ricci","orcid":"https://orcid.org/0000-0002-2128-7456"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Riccardo Ricci","raw_affiliation_strings":["Department of Information Engineering and Computer Science, University of Trento, 38123 Trento, Italy"],"raw_orcid":"https://orcid.org/0000-0002-2128-7456","affiliations":[{"raw_affiliation_string":"Department of Information Engineering and Computer Science, University of Trento, 38123 Trento, Italy","institution_ids":["https://openalex.org/I193223587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054237841","display_name":"Yakoub Bazi","orcid":"https://orcid.org/0000-0001-9287-0596"},"institutions":[{"id":"https://openalex.org/I28022161","display_name":"King Saud University","ror":"https://ror.org/02f81g417","country_code":"SA","type":"education","lineage":["https://openalex.org/I28022161"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Yakoub Bazi","raw_affiliation_strings":["Department of Computer Engineering, College of Computer and Information Sciences, King Saud University, Riyadh 4545, Saudi Arabia"],"raw_orcid":"https://orcid.org/0000-0001-9287-0596","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, College of Computer and Information Sciences, King Saud University, Riyadh 4545, Saudi Arabia","institution_ids":["https://openalex.org/I28022161"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021389231","display_name":"Farid Melgani","orcid":"https://orcid.org/0000-0001-9745-3732"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Farid Melgani","raw_affiliation_strings":["Department of Information Engineering and Computer Science, University of Trento, 38123 Trento, Italy"],"raw_orcid":"https://orcid.org/0000-0001-9745-3732","affiliations":[{"raw_affiliation_string":"Department of Information Engineering and Computer Science, University of Trento, 38123 Trento, Italy","institution_ids":["https://openalex.org/I193223587"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5021389231"],"corresponding_institution_ids":["https://openalex.org/I193223587"],"apc_list":{"value":2500,"currency":"CHF","value_usd":2707},"apc_paid":{"value":2500,"currency":"CHF","value_usd":2707},"fwci":2.6557,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.90676562,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"16","issue":"3","first_page":"441","last_page":"441"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6568272709846497},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5394222736358643},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43794745206832886},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.37676554918289185}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6568272709846497},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5394222736358643},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43794745206832886},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37676554918289185}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/rs16030441","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16030441","pdf_url":"https://www.mdpi.com/2072-4292/16/3/441/pdf?version=1706008784","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:iris.unitn.it:11572/437939","is_oa":true,"landing_page_url":"https://www.mdpi.com/2072-4292/16/3/441","pdf_url":"https://www.mdpi.com/2072-4292/16/3/441/pdf","source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:doaj.org/article:83018d99f9414cf3a0c89dfe14b2a685","is_oa":true,"landing_page_url":"https://doaj.org/article/83018d99f9414cf3a0c89dfe14b2a685","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing, Vol 16, Iss 3, p 441 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/rs16030441","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16030441","pdf_url":"https://www.mdpi.com/2072-4292/16/3/441/pdf?version=1706008784","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391136447.pdf"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1933349210","https://openalex.org/W1983927101","https://openalex.org/W2157331557","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2510520237","https://openalex.org/W2603566245","https://openalex.org/W2607059968","https://openalex.org/W2779054585","https://openalex.org/W2889606145","https://openalex.org/W2920981979","https://openalex.org/W2979924880","https://openalex.org/W3012111773","https://openalex.org/W3015625772","https://openalex.org/W3029273706","https://openalex.org/W3098351727","https://openalex.org/W3100245404","https://openalex.org/W3153469116","https://openalex.org/W3196922338","https://openalex.org/W4229439310","https://openalex.org/W4285818301","https://openalex.org/W4289537913","https://openalex.org/W4292828962","https://openalex.org/W4292968451","https://openalex.org/W4312272867","https://openalex.org/W4312915946","https://openalex.org/W4360930321","https://openalex.org/W6800425103","https://openalex.org/W6810920957","https://openalex.org/W6841412193","https://openalex.org/W6842763721"],"related_works":["https://openalex.org/W2755342338","https://openalex.org/W2058170566","https://openalex.org/W2036807459","https://openalex.org/W2775347418","https://openalex.org/W1969923398","https://openalex.org/W2772917594","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2079911747"],"abstract_inverted_index":{"Image":[0],"captioning":[1,62,97],"is":[2,63],"a":[3,53,67,96,106,128,133],"technique":[4],"that":[5,77],"enables":[6],"the":[7,15,21,26,36,49,73,138,153,160],"automatic":[8],"extraction":[9],"of":[10,17,28,58,121,155,162],"natural":[11,29],"language":[12,30],"descriptions":[13,120],"about":[14],"contents":[16],"an":[18,157],"image.":[19],"On":[20],"one":[22,91],"hand,":[23],"information":[24,76,164],"in":[25,159],"form":[27,57],"can":[31],"enhance":[32],"accessibility":[33],"by":[34,94,132],"reducing":[35],"expertise":[37],"required":[38],"to":[39,66,89,108,115],"process,":[40],"analyze,":[41],"and":[42,55,110,118,136,167,171],"exploit":[43],"remote":[44,80,149],"sensing":[45,81,150],"images,":[46],"while":[47],"on":[48,127,146],"other,":[50],"it":[51],"provides":[52],"direct":[54],"general":[56],"communication.":[59],"However,":[60],"image":[61,135],"usually":[64],"restricted":[65],"single":[68],"sentence,":[69],"which":[70],"barely":[71],"describes":[72],"rich":[74],"semantic":[75,163],"typically":[78],"characterizes":[79],"(RS)":[82],"images.":[83],"In":[84],"this":[85],"paper,":[86],"we":[87],"aim":[88],"move":[90],"step":[92],"forward":[93],"proposing":[95],"system":[98,125],"that,":[99],"mimicking":[100],"human":[101],"behavior,":[102],"adopts":[103],"dialogue":[104,139],"as":[105,173,175],"tool":[107],"explore":[109],"dig":[111],"for":[112],"information,":[113],"leading":[114],"more":[116],"detailed":[117],"comprehensive":[119],"RS":[122],"scenes.":[123],"The":[124],"relies":[126],"questions\u2013answers":[129],"scheme":[130],"fed":[131],"query":[134],"summarizes":[137],"content":[140],"with":[141],"ChatGPT.":[142],"Experiments":[143],"carried":[144],"out":[145],"two":[147],"benchmark":[148],"datasets":[151],"confirm":[152],"potential":[154],"such":[156],"approach":[158],"context":[161],"mining.":[165],"Strengths":[166],"weaknesses":[168],"are":[169],"highlighted":[170],"discussed,":[172],"well":[174],"some":[176],"possible":[177],"future":[178],"developments.":[179]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":6}],"updated_date":"2026-06-03T09:05:47.796612","created_date":"2025-10-10T00:00:00"}
