{"id":"https://openalex.org/W4304084117","doi":"https://doi.org/10.1145/3503161.3548058","title":"Image-Text Matching with Fine-Grained Relational Dependency and Bidirectional Attention-Based Generative Networks","display_name":"Image-Text Matching with Fine-Grained Relational Dependency and Bidirectional Attention-Based Generative Networks","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4304084117","doi":"https://doi.org/10.1145/3503161.3548058"},"language":"en","primary_location":{"id":"doi:10.1145/3503161.3548058","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548058","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053196390","display_name":"Jianwei Zhu","orcid":"https://orcid.org/0000-0002-8272-9190"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jianwei Zhu","raw_affiliation_strings":["Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100701695","display_name":"Zhixin Li","orcid":"https://orcid.org/0000-0002-5313-6134"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixin Li","raw_affiliation_strings":["Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061609383","display_name":"Yufei Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufei Zeng","raw_affiliation_strings":["Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076598143","display_name":"Jiahui Wei","orcid":"https://orcid.org/0009-0005-8060-2929"},"institutions":[{"id":"https://openalex.org/I29739308","display_name":"Guangxi Normal University","ror":"https://ror.org/02frt9q65","country_code":"CN","type":"education","lineage":["https://openalex.org/I29739308"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiahui Wei","raw_affiliation_strings":["Guangxi Normal University, Guilin, China"],"affiliations":[{"raw_affiliation_string":"Guangxi Normal University, Guilin, China","institution_ids":["https://openalex.org/I29739308"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053794277","display_name":"Huifang Ma","orcid":"https://orcid.org/0000-0002-5104-8982"},"institutions":[{"id":"https://openalex.org/I68986083","display_name":"Northwest Normal University","ror":"https://ror.org/00gx3j908","country_code":"CN","type":"education","lineage":["https://openalex.org/I68986083"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huifang Ma","raw_affiliation_strings":["Northwest Normal University, Lanzhou, China"],"affiliations":[{"raw_affiliation_string":"Northwest Normal University, Lanzhou, China","institution_ids":["https://openalex.org/I68986083"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5053196390"],"corresponding_institution_ids":["https://openalex.org/I29739308"],"apc_list":null,"apc_paid":null,"fwci":1.9177,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.90603166,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"395","last_page":"403"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7763837575912476},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6472941040992737},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6395261287689209},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5757867097854614},{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.5554839968681335},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.542281985282898},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5234850645065308},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5116612911224365},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.49012836813926697},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.4789572060108185},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4785502552986145},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.4725876748561859},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.4686927795410156},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4401416480541229},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.4249809980392456},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3895551562309265},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3759608268737793},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.2206639051437378},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10445928573608398}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7763837575912476},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6472941040992737},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6395261287689209},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5757867097854614},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.5554839968681335},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.542281985282898},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5234850645065308},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5116612911224365},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.49012836813926697},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.4789572060108185},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4785502552986145},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.4725876748561859},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.4686927795410156},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4401416480541229},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.4249809980392456},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3895551562309265},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3759608268737793},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2206639051437378},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10445928573608398},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3503161.3548058","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548058","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2953015661","display_name":null,"funder_award_id":"61966004, 61866004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W1895577753","https://openalex.org/W1905882502","https://openalex.org/W2024539680","https://openalex.org/W2102605133","https://openalex.org/W2158289097","https://openalex.org/W2185175083","https://openalex.org/W2187089797","https://openalex.org/W2250539671","https://openalex.org/W2613718673","https://openalex.org/W2745461083","https://openalex.org/W2932399282","https://openalex.org/W2962964995","https://openalex.org/W2963389687","https://openalex.org/W2963467339","https://openalex.org/W2963966654","https://openalex.org/W2964024144","https://openalex.org/W2964080601","https://openalex.org/W2964216321","https://openalex.org/W2982078236","https://openalex.org/W2988823324","https://openalex.org/W2994818707","https://openalex.org/W3010277541","https://openalex.org/W3035454331","https://openalex.org/W3088172692","https://openalex.org/W3096407995","https://openalex.org/W3202572107","https://openalex.org/W3202748396","https://openalex.org/W4205357838","https://openalex.org/W4385245566","https://openalex.org/W6601955380","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4395044357","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W2087346071","https://openalex.org/W2967848559","https://openalex.org/W4299831724"],"abstract_inverted_index":{"Generally,":[0],"most":[1],"existing":[2],"cross-modal":[3],"retrieval":[4],"methods":[5],"only":[6],"consider":[7],"global":[8,113],"or":[9],"local":[10,90,95],"semantic":[11],"embeddings,":[12],"lacking":[13],"fine-grained":[14],"dependencies":[15,64],"between":[16,30,65,81,134],"objects.":[17,66,135],"At":[18],"the":[19,27,34,78,84,94,98,102,112,116,144],"same":[20],"time,":[21],"it":[22,69],"is":[23,87,105],"usually":[24],"ignored":[25],"that":[26,143],"mutual":[28,79,108],"transformation":[29,80,109],"modalities":[31],"also":[32,121],"facilitates":[33],"embedding":[35,49,127],"of":[36,97,115,146],"modalities.":[37,82,117],"Given":[38],"these":[39],"problems,":[40],"we":[41,120],"propose":[42,122],"a":[43,56,71,123],"method":[44,148],"called":[45],"BiKA":[46],"(Bidirectional":[47],"Knowledge-assisted":[48],"and":[50],"Attention-based":[51],"generation).":[52],"The":[53,136],"model":[54],"uses":[55],"bidirectional":[57,72],"graph":[58,86],"convolutional":[59],"neural":[60],"network":[61,75,104,128],"to":[62,76,92,110,129,154],"establish":[63],"In":[67,118],"addition,":[68,119],"employs":[70],"attention-based":[73],"generative":[74,103],"achieve":[77],"Specifically,":[83],"knowledge":[85],"used":[88,106],"for":[89,107],"matching":[91],"constrain":[93,111],"expression":[96,114],"modalities,":[99],"in":[100],"which":[101],"new":[124],"position":[125,131],"relation":[126,132],"embed":[130],"information":[133],"experiments":[137],"on":[138],"two":[139],"public":[140],"datasets":[141],"show":[142],"performance":[145],"our":[147],"has":[149],"been":[150],"dramatically":[151],"improved":[152],"compared":[153],"many":[155],"state-of-the-art":[156],"models.":[157]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":11}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
