{"id":"https://openalex.org/W4407941492","doi":"https://doi.org/10.3390/bdcc9030053","title":"Fine-Grained Local and Global Semantic Fusion for Multimodal Image\u2013Text Retrieval","display_name":"Fine-Grained Local and Global Semantic Fusion for Multimodal Image\u2013Text Retrieval","publication_year":2025,"publication_date":"2025-02-25","ids":{"openalex":"https://openalex.org/W4407941492","doi":"https://doi.org/10.3390/bdcc9030053"},"language":"en","primary_location":{"id":"doi:10.3390/bdcc9030053","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9030053","pdf_url":"https://www.mdpi.com/2504-2289/9/3/53/pdf?version=1740494338","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-2289/9/3/53/pdf?version=1740494338","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108008219","display_name":"Shaoliang Peng","orcid":"https://orcid.org/0000-0002-4647-2615"},"institutions":[{"id":"https://openalex.org/I49934816","display_name":"Hunan University of Technology","ror":"https://ror.org/04j3vr751","country_code":"CN","type":"education","lineage":["https://openalex.org/I49934816"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shenao Peng","raw_affiliation_strings":["College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China"],"affiliations":[{"raw_affiliation_string":"College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China","institution_ids":["https://openalex.org/I49934816"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101980926","display_name":"Zhongmei Wang","orcid":"https://orcid.org/0000-0003-0031-0925"},"institutions":[{"id":"https://openalex.org/I49934816","display_name":"Hunan University of Technology","ror":"https://ror.org/04j3vr751","country_code":"CN","type":"education","lineage":["https://openalex.org/I49934816"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongmei Wang","raw_affiliation_strings":["College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China"],"affiliations":[{"raw_affiliation_string":"College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China","institution_ids":["https://openalex.org/I49934816"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405318","display_name":"Jianhua Liu","orcid":"https://orcid.org/0000-0002-1694-0975"},"institutions":[{"id":"https://openalex.org/I49934816","display_name":"Hunan University of Technology","ror":"https://ror.org/04j3vr751","country_code":"CN","type":"education","lineage":["https://openalex.org/I49934816"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Liu","raw_affiliation_strings":["College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China"],"affiliations":[{"raw_affiliation_string":"College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China","institution_ids":["https://openalex.org/I49934816"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041815973","display_name":"Changfan Zhang","orcid":"https://orcid.org/0000-0002-7439-1775"},"institutions":[{"id":"https://openalex.org/I49934816","display_name":"Hunan University of Technology","ror":"https://ror.org/04j3vr751","country_code":"CN","type":"education","lineage":["https://openalex.org/I49934816"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changfan Zhang","raw_affiliation_strings":["College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China"],"affiliations":[{"raw_affiliation_string":"College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China","institution_ids":["https://openalex.org/I49934816"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111517656","display_name":"Lin Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I49934816","display_name":"Hunan University of Technology","ror":"https://ror.org/04j3vr751","country_code":"CN","type":"education","lineage":["https://openalex.org/I49934816"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Jia","raw_affiliation_strings":["College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China"],"affiliations":[{"raw_affiliation_string":"College of Railway Transportation, Hunan University of Technology, Zhuzhou 412007, China","institution_ids":["https://openalex.org/I49934816"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101980926"],"corresponding_institution_ids":["https://openalex.org/I49934816"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":1.3688,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.77657576,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"9","issue":"3","first_page":"53","last_page":"53"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9843000173568726,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9641000032424927,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6466243267059326},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6301278471946716},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.41829124093055725},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.41685158014297485},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.40303558111190796},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3936595022678375},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3927716612815857},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.120319664478302}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6466243267059326},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6301278471946716},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.41829124093055725},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.41685158014297485},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.40303558111190796},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3936595022678375},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3927716612815857},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.120319664478302},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/bdcc9030053","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9030053","pdf_url":"https://www.mdpi.com/2504-2289/9/3/53/pdf?version=1740494338","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b33895c3c5b0471f9595a54c0c5c3f3a","is_oa":true,"landing_page_url":"https://doaj.org/article/b33895c3c5b0471f9595a54c0c5c3f3a","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Big Data and Cognitive Computing, Vol 9, Iss 3, p 53 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/bdcc9030053","is_oa":true,"landing_page_url":"https://doi.org/10.3390/bdcc9030053","pdf_url":"https://www.mdpi.com/2504-2289/9/3/53/pdf?version=1740494338","source":{"id":"https://openalex.org/S4210238752","display_name":"Big Data and Cognitive Computing","issn_l":"2504-2289","issn":["2504-2289"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Big Data and Cognitive Computing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5393611267","display_name":null,"funder_award_id":"52272347","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4407941492.pdf"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1773149199","https://openalex.org/W2194775991","https://openalex.org/W2546696630","https://openalex.org/W2606473278","https://openalex.org/W2745461083","https://openalex.org/W2962964995","https://openalex.org/W2963389687","https://openalex.org/W2963988212","https://openalex.org/W2969656782","https://openalex.org/W2981586349","https://openalex.org/W2982078236","https://openalex.org/W2994818707","https://openalex.org/W3035212740","https://openalex.org/W3035454331","https://openalex.org/W3035552787","https://openalex.org/W3035588244","https://openalex.org/W3092820619","https://openalex.org/W3132789844","https://openalex.org/W3175888430","https://openalex.org/W3201877472","https://openalex.org/W3213100861","https://openalex.org/W4210894218","https://openalex.org/W4214819138","https://openalex.org/W4229626506","https://openalex.org/W4284698859","https://openalex.org/W4295679074","https://openalex.org/W4312761738","https://openalex.org/W4386071498","https://openalex.org/W4386071757","https://openalex.org/W4400490009","https://openalex.org/W4401754729","https://openalex.org/W4402360562","https://openalex.org/W4403334624","https://openalex.org/W6745537798","https://openalex.org/W6766970537"],"related_works":["https://openalex.org/W2099421762","https://openalex.org/W2530546662","https://openalex.org/W2967030268","https://openalex.org/W1986902711","https://openalex.org/W2396760013","https://openalex.org/W2148433556","https://openalex.org/W2171776552","https://openalex.org/W98391849","https://openalex.org/W1600907701","https://openalex.org/W2726741344"],"abstract_inverted_index":{"An":[0],"image\u2013text":[1],"retrieval":[2,37,145,151],"method":[3,132,139],"that":[4],"integrates":[5],"intramodal":[6,82],"fine-grained":[7,22],"local":[8,63],"semantic":[9,14,27],"information":[10,15],"and":[11,32,45,49,85,90,105,121,127,146],"intermodal":[12],"global":[13],"is":[16,54,69,98,107],"proposed":[17,131],"to":[18,60,100],"address":[19],"the":[20,26,40,77,102,119,125,130,137,156],"weak":[21],"discrimination":[23],"capabilities":[24],"for":[25,56,71,143,149],"features":[28,42],"located":[29],"between":[30],"image":[31,89,144],"text":[33,91],"modalities":[34],"in":[35],"cross-modal":[36],"tasks.":[38],"First,":[39],"original":[41],"of":[43,129],"images":[44],"texts":[46],"are":[47],"extracted,":[48],"a":[50,94],"graph":[51],"attention":[52,67],"network":[53],"employed":[55],"region":[57],"relationship":[58,83],"reasoning":[59],"obtain":[61],"relation-enhanced":[62],"features.":[64],"Then,":[65],"an":[66,110],"mechanism":[68],"used":[70,99],"different":[72],"semantically":[73,87],"interacting":[74],"samples":[75],"within":[76],"same":[78],"modality,":[79],"enabling":[80],"comprehensive":[81],"learning":[84],"producing":[86],"enhanced":[88,108],"embeddings.":[92],"Finally,":[93],"triplet":[95],"loss":[96],"function":[97],"train":[101],"entire":[103],"model,":[104],"it":[106],"with":[109],"angular":[111],"constraint.":[112],"Through":[113],"extensive":[114],"comparative":[115],"experiments":[116],"conducted":[117],"on":[118,152],"Flickr30K":[120],"MS-COCO":[122,153],"benchmark":[123],"datasets,":[124],"effectiveness":[126],"superiority":[128],"were":[133],"verified.":[134],"It":[135],"outperformed":[136],"current":[138],"by":[140],"6.4%":[141],"relatively":[142,148],"1.3%":[147],"caption":[150],"(Recall@1":[154],"using":[155],"1K":[157],"test":[158],"set).":[159]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
