{"id":"https://openalex.org/W4394712991","doi":"https://doi.org/10.1109/bigcomp60711.2024.00024","title":"Multimodal Knowledge Graph-Guided Cross-Modal Graph Network for Image-Text Retrieval","display_name":"Multimodal Knowledge Graph-Guided Cross-Modal Graph Network for Image-Text Retrieval","publication_year":2024,"publication_date":"2024-02-18","ids":{"openalex":"https://openalex.org/W4394712991","doi":"https://doi.org/10.1109/bigcomp60711.2024.00024"},"language":"en","primary_location":{"id":"doi:10.1109/bigcomp60711.2024.00024","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp60711.2024.00024","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data and Smart Computing (BigComp)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047842812","display_name":"Jun\u2010Cheng Zheng","orcid":"https://orcid.org/0009-0009-5524-3994"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Juncheng Zheng","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876"],"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056818951","display_name":"Meiyu Liang","orcid":"https://orcid.org/0000-0003-1835-1848"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meiyu Liang","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876"],"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101798913","display_name":"Yang Yu","orcid":"https://orcid.org/0009-0000-4686-1170"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Yu","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876"],"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100663187","display_name":"Junping Du","orcid":"https://orcid.org/0000-0001-8590-3767"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junping Du","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876"],"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088046237","display_name":"Zhe Xue","orcid":"https://orcid.org/0000-0001-6123-0043"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Xue","raw_affiliation_strings":["School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876"],"affiliations":[{"raw_affiliation_string":"School of Computer Science (National Pilot Software Engineering School), Beijing University of Posts and Telecommunications,Beijing Key Laboratory of Intelligent Communication Software and Multimedia,Beijing,China,100876","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5047842812"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.7895,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.70599885,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"97","last_page":"100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9606999754905701,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9595000147819519,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7266097664833069},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.5855810046195984},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5852601528167725},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5701504349708557},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4171898663043976},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4121393859386444},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2857523560523987}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7266097664833069},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.5855810046195984},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5852601528167725},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5701504349708557},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4171898663043976},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4121393859386444},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2857523560523987},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigcomp60711.2024.00024","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigcomp60711.2024.00024","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data and Smart Computing (BigComp)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2739181657","https://openalex.org/W2937703861","https://openalex.org/W2962964995","https://openalex.org/W2964727037","https://openalex.org/W2988823324","https://openalex.org/W3010277541","https://openalex.org/W3101540864","https://openalex.org/W3110042533","https://openalex.org/W3148395438","https://openalex.org/W4214819138","https://openalex.org/W4312877428","https://openalex.org/W4317436342","https://openalex.org/W6741383107"],"related_works":["https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W613940353","https://openalex.org/W2320915480","https://openalex.org/W2362990116","https://openalex.org/W2381300099","https://openalex.org/W2714992399","https://openalex.org/W2383812217","https://openalex.org/W2326515389","https://openalex.org/W2054026175"],"abstract_inverted_index":{"Image-text":[0],"retrieval":[1,23,235],"is":[2],"a":[3,160,199],"fundamental":[4],"cross-modal":[5,35,59,84,171,208,217],"task,":[6],"which":[7,98,148],"dedicates":[8],"to":[9,57,82,101,122,159,211],"align":[10],"the":[11,152,185,196,203,213,221],"representation":[12,153],"space":[13,154,214],"between":[14],"image":[15,26,133],"modality":[16],"and":[17,27,37,86,95,105,117,135,150,157,168,188,193,206,223],"text":[18,136],"modality.":[19],"Existing":[20],"cross-interactive":[21],"image-text":[22,234],"methods":[24],"generate":[25,93,107],"sentence":[28],"em-beddings":[29],"independently,":[30],"introduce":[31],"interaction-based":[32],"networks":[33],"for":[34,178],"reasoning,":[36],"then":[38],"retrieve":[39],"them":[40],"using":[41],"matching":[42],"metrics.":[43],"However,":[44],"existing":[45],"approaches":[46],"do":[47],"not":[48],"consider":[49],"fully":[50],"utilizing":[51],"semantic":[52,62,94,113,180],"relationships":[53,85,190],"among":[54],"multimodal":[55,79],"knowledge":[56,80],"enhance":[58,87],"fine-grained":[60,170],"implicit":[61,186],"reasoning":[63,125],"capabilities.":[64],"In":[65,90],"this":[66],"paper,":[67],"we":[68,128,183],"propose":[69],"Multimodal":[70,144],"Knowledge":[71,145],"Graph-guided":[72],"Cross-modal":[73],"Graph":[74,146],"Network":[75],"(MKCGN)":[76],"that":[77,228],"exploits":[78],"graphs":[81,109,119],"explore":[83],"global":[88,204],"representations.":[89,218],"MKCGN,":[91],"images":[92,192],"spatial":[96],"graphs,":[97,104],"are":[99,120],"used":[100,121],"represent":[102],"visual":[103,116],"sentences":[106],"textual":[108,118],"based":[110,138],"on":[111,139,220],"word":[112],"relations.":[114],"The":[115],"implement":[123],"inter-modal":[124,166,179],"respectively.":[126],"Then":[127],"obtain":[129],"interest":[130],"embeddings":[131],"of":[132,155,191,201,215],"regions":[134,156],"words":[137,158],"entity":[140],"embed":[141],"dings":[142],"in":[143],"(MKG),":[147],"approximates":[149],"aligns":[151],"certain":[161],"extent,":[162],"thus":[163],"obtaining":[164],"effective":[165],"interactions":[167],"learning":[169],"communication":[172],"through":[173,195],"graph":[174],"node":[175],"contrast":[176,209],"loss":[177,210],"reasoning.":[181],"Finally,":[182],"mine":[184],"semantics":[187],"potential":[189],"texts":[194],"MKG":[197],"as":[198],"means":[200],"enhancing":[202],"representations":[205],"use":[207],"narrow":[212],"coarse-grained":[216],"Experiments":[219],"MS-COCO":[222],"Flickr30K":[224],"benchmark":[225],"datasets":[226],"show":[227],"our":[229],"proposed":[230],"MKCGN":[231],"outperforms":[232],"state-of-the-art":[233],"methods.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
