{"id":"https://openalex.org/W3008356057","doi":"https://doi.org/10.1109/access.2020.2975594","title":"Multi-Modal Memory Enhancement Attention Network for Image-Text Matching","display_name":"Multi-Modal Memory Enhancement Attention Network for Image-Text Matching","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3008356057","doi":"https://doi.org/10.1109/access.2020.2975594","mag":"3008356057"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.2975594","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2975594","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09006782.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09006782.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005367680","display_name":"Zhong Ji","orcid":"https://orcid.org/0000-0002-2197-3739"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhong Ji","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0002-2197-3739","affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000199509","display_name":"Zhigang Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhigang Lin","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100324809","display_name":"Haoran Wang","orcid":"https://orcid.org/0000-0001-6350-5645"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoran Wang","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100654741","display_name":"Yuqing He","orcid":"https://orcid.org/0000-0003-1666-4330"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuqing He","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0003-1666-4330","affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5005367680"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.0788,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.7934518,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"8","issue":null,"first_page":"38438","last_page":"38447"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8642379641532898},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6220844984054565},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5477260947227478},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5449525117874146},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5438362956047058},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5242053270339966},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5124693512916565},{"id":"https://openalex.org/keywords/memorization","display_name":"Memorization","score":0.45982125401496887},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4340205788612366},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.41553959250450134},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.35505521297454834},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0943945050239563}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8642379641532898},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6220844984054565},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5477260947227478},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5449525117874146},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5438362956047058},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5242053270339966},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5124693512916565},{"id":"https://openalex.org/C30038468","wikidata":"https://www.wikidata.org/wiki/Q4354775","display_name":"Memorization","level":2,"score":0.45982125401496887},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4340205788612366},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.41553959250450134},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35505521297454834},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0943945050239563},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.2975594","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2975594","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09006782.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:2d72a124de2e401fb411156abdc5860d","is_oa":true,"landing_page_url":"https://doaj.org/article/2d72a124de2e401fb411156abdc5860d","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 38438-38447 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.2975594","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2975594","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09006782.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G3635174350","display_name":null,"funder_award_id":"19JCYBJC16000","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"},{"id":"https://openalex.org/G3732680637","display_name":null,"funder_award_id":"61771329","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4256591871","display_name":null,"funder_award_id":"61771329","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"},{"id":"https://openalex.org/G8502464038","display_name":null,"funder_award_id":"19JCYBJC16000","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323993","display_name":"Natural Science Foundation of Tianjin City","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3008356057.pdf","grobid_xml":"https://content.openalex.org/works/W3008356057.grobid-xml"},"referenced_works_count":76,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1522301498","https://openalex.org/W1527575280","https://openalex.org/W1614298861","https://openalex.org/W1773149199","https://openalex.org/W1811254738","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W1916445035","https://openalex.org/W1957706851","https://openalex.org/W2099857613","https://openalex.org/W2112912048","https://openalex.org/W2123024445","https://openalex.org/W2133564696","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2293453011","https://openalex.org/W2546696630","https://openalex.org/W2554906389","https://openalex.org/W2606473278","https://openalex.org/W2737766105","https://openalex.org/W2739181657","https://openalex.org/W2752782242","https://openalex.org/W2798280084","https://openalex.org/W2799263800","https://openalex.org/W2883311563","https://openalex.org/W2892573207","https://openalex.org/W2894786240","https://openalex.org/W2900953995","https://openalex.org/W2913639291","https://openalex.org/W2913943056","https://openalex.org/W2936420065","https://openalex.org/W2942614241","https://openalex.org/W2950577311","https://openalex.org/W2951008357","https://openalex.org/W2956018683","https://openalex.org/W2962706528","https://openalex.org/W2962781483","https://openalex.org/W2962851485","https://openalex.org/W2962964995","https://openalex.org/W2963040148","https://openalex.org/W2963389687","https://openalex.org/W2963420686","https://openalex.org/W2963448850","https://openalex.org/W2963467339","https://openalex.org/W2963495494","https://openalex.org/W2963526065","https://openalex.org/W2963680240","https://openalex.org/W2963899908","https://openalex.org/W2964120214","https://openalex.org/W2964187781","https://openalex.org/W2964308564","https://openalex.org/W2965848243","https://openalex.org/W2981586349","https://openalex.org/W2988823324","https://openalex.org/W2998825242","https://openalex.org/W4299801216","https://openalex.org/W4303633609","https://openalex.org/W4385245566","https://openalex.org/W6630875275","https://openalex.org/W6631190155","https://openalex.org/W6631516269","https://openalex.org/W6636510571","https://openalex.org/W6638318767","https://openalex.org/W6638742206","https://openalex.org/W6676647902","https://openalex.org/W6678470764","https://openalex.org/W6679434410","https://openalex.org/W6684191040","https://openalex.org/W6684821475","https://openalex.org/W6685183736","https://openalex.org/W6697449767","https://openalex.org/W6732742072","https://openalex.org/W6739901393","https://openalex.org/W6740863234"],"related_works":["https://openalex.org/W4387561393","https://openalex.org/W3163481960","https://openalex.org/W3093895509","https://openalex.org/W4283526844","https://openalex.org/W280704926","https://openalex.org/W2476068070","https://openalex.org/W4323971310","https://openalex.org/W2893372175","https://openalex.org/W2323394100","https://openalex.org/W1972827106"],"abstract_inverted_index":{"Image-text":[0],"matching":[1],"is":[2,97],"an":[3],"attractive":[4],"research":[5],"topic":[6],"in":[7,28,126],"the":[8,19,48,60,66,71,83,87,101,113,127,136,151,157,170,203],"community":[9],"of":[10,107,115],"vision":[11],"and":[12,24,33,64,109,153,160,177,194],"language.":[13],"The":[14],"key":[15],"element":[16],"to":[17,30,42,46,58,69,99,120,134,168],"narrow":[18],"\u201cheterogeneity":[20],"gap\u201d":[21],"between":[22],"visual":[23],"textual":[25],"data":[26],"lies":[27],"how":[29],"learn":[31,135],"powerful":[32],"robust":[34],"representations":[35,138],"for":[36,122,191],"both":[37,105,175],"modalities.":[38],"This":[39],"paper":[40],"proposes":[41],"alleviate":[43],"this":[44],"issue":[45],"achieve":[47,202],"fine-grained":[49],"visual-textual":[50],"alignment":[51],"from":[52,104],"two":[53,207],"aspects:":[54],"exploiting":[55],"attention":[56],"mechanism":[57],"locate":[59],"semantically":[61,188],"meaningful":[62],"portion":[63],"leveraging":[65],"memory":[67,158],"network":[68],"capture":[70],"long-term":[72,116],"contextual":[73,117],"knowledge.":[74],"Unlike":[75],"most":[76],"existing":[77],"studies":[78],"sorely":[79],"focus":[80],"on":[81,206],"exploring":[82],"cross-modal":[84,165],"associations":[85],"at":[86],"fragment":[88,108],"level,":[89],"our":[90,184,199],"designed":[91],"Collaborative":[92],"Dual":[93],"Attention":[94],"(CDA)":[95],"module":[96],"able":[98],"model":[100,200],"semantic":[102],"interdependencies":[103],"perspectives":[106],"channel.":[110],"Furthermore,":[111],"considering":[112],"usage":[114],"knowledge":[118],"contributes":[119],"compensate":[121],"detailed":[123],"semantics":[124,167],"concealed":[125],"rarely":[128],"appeared":[129],"image-text":[130],"pairs,":[131],"we":[132],"present":[133],"joint":[137],"by":[139],"constructing":[140],"a":[141,181],"Multi-Modal":[142],"Memory":[143],"Enhancement":[144],"(M3E)":[145],"module.":[146],"Specifically,":[147],"it":[148],"sequentially":[149],"restores":[150],"intra-modal":[152],"multi-modal":[154],"information":[155],"into":[156,180],"items,":[159],"they":[161],"conversely":[162],"persistently":[163],"memorize":[164],"shared":[166],"improve":[169],"latent":[171],"embeddings.":[172],"By":[173],"incorporating":[174],"CDA":[176],"M3E":[178],"modules":[179],"deep":[182],"architecture,":[183],"approach":[185],"generates":[186],"more":[187],"consistent":[189],"embeddings":[190],"representing":[192],"images":[193],"texts.":[195],"Extensive":[196],"experiments":[197],"demonstrate":[198],"can":[201],"state-of-the-art":[204],"results":[205],"public":[208],"benchmark":[209],"datasets.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
