{"id":"https://openalex.org/W3209163491","doi":"https://doi.org/10.1109/tip.2021.3123553","title":"Memorize, Associate and Match: Embedding Enhancement via Fine-Grained Alignment for Image-Text Retrieval","display_name":"Memorize, Associate and Match: Embedding Enhancement via Fine-Grained Alignment for Image-Text Retrieval","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3209163491","doi":"https://doi.org/10.1109/tip.2021.3123553","mag":"3209163491","pmid":"https://pubmed.ncbi.nlm.nih.gov/34739375"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2021.3123553","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3123553","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047636121","display_name":"Jiangtong Li","orcid":"https://orcid.org/0000-0003-3873-4053"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiangtong Li","raw_affiliation_strings":["MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China. (e-mail: jiangtongli1997@gmail.com)","Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China. (e-mail: jiangtongli1997@gmail.com)","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100324301","display_name":"Liu Liu","orcid":"https://orcid.org/0000-0003-4218-8008"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liu Liu","raw_affiliation_strings":["MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032618817","display_name":"Li Niu","orcid":"https://orcid.org/0000-0003-1970-8634"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Niu","raw_affiliation_strings":["MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100741568","display_name":"Liqing Zhang","orcid":"https://orcid.org/0000-0001-7597-8503"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liqing Zhang","raw_affiliation_strings":["MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Artificial Intelligence, Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Department of Computer Science and Engineering, MOE Key Laboratory of Artificial Intelligence, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047636121"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":3.2663,"has_fulltext":false,"cited_by_count":41,"citation_normalized_percentile":{"value":0.93632353,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"30","issue":null,"first_page":"9193","last_page":"9207"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8083583116531372},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7867801189422607},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.6979246139526367},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6271041631698608},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5020897388458252},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.490337610244751},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4874858856201172},{"id":"https://openalex.org/keywords/visual-word","display_name":"Visual Word","score":0.4417819082736969},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.34915056824684143}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8083583116531372},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7867801189422607},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.6979246139526367},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6271041631698608},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5020897388458252},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.490337610244751},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4874858856201172},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.4417819082736969},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34915056824684143},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2021.3123553","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3123553","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:34739375","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34739375","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4118779427","display_name":null,"funder_award_id":"2018AAA0100704","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5329974562","display_name":null,"funder_award_id":"2021SHZDZX0102","funder_id":"https://openalex.org/F4320311779","funder_display_name":"Shanghai Association for Science and Technology"},{"id":"https://openalex.org/G5660070723","display_name":null,"funder_award_id":"62076162","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320311779","display_name":"Shanghai Association for Science and Technology","ror":"https://ror.org/05j0k2q54"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1522301498","https://openalex.org/W1527575280","https://openalex.org/W1861492603","https://openalex.org/W1895989618","https://openalex.org/W1925193522","https://openalex.org/W1933349210","https://openalex.org/W2006409313","https://openalex.org/W2106277773","https://openalex.org/W2112912048","https://openalex.org/W2157364932","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2267186426","https://openalex.org/W2277195237","https://openalex.org/W2476624367","https://openalex.org/W2546696630","https://openalex.org/W2552579943","https://openalex.org/W2586050494","https://openalex.org/W2591669147","https://openalex.org/W2607579284","https://openalex.org/W2613718673","https://openalex.org/W2735608653","https://openalex.org/W2739759426","https://openalex.org/W2745461083","https://openalex.org/W2774267535","https://openalex.org/W2896457183","https://openalex.org/W2896798564","https://openalex.org/W2898403805","https://openalex.org/W2899771611","https://openalex.org/W2900953995","https://openalex.org/W2909384861","https://openalex.org/W2949847915","https://openalex.org/W2950527759","https://openalex.org/W2951008357","https://openalex.org/W2956335072","https://openalex.org/W2962954913","https://openalex.org/W2962964995","https://openalex.org/W2963115613","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963448850","https://openalex.org/W2963499204","https://openalex.org/W2963954913","https://openalex.org/W2964015378","https://openalex.org/W2964081303","https://openalex.org/W2964121744","https://openalex.org/W2965848243","https://openalex.org/W2981586349","https://openalex.org/W2988823324","https://openalex.org/W2991539277","https://openalex.org/W2994818707","https://openalex.org/W2998215884","https://openalex.org/W3008356057","https://openalex.org/W3010277541","https://openalex.org/W3035454331","https://openalex.org/W3035605030","https://openalex.org/W3087516599","https://openalex.org/W3103717910","https://openalex.org/W4303633609","https://openalex.org/W4385245566","https://openalex.org/W6620707391","https://openalex.org/W6631190155","https://openalex.org/W6631516269","https://openalex.org/W6638318767","https://openalex.org/W6639102338","https://openalex.org/W6676647902","https://openalex.org/W6684821475","https://openalex.org/W6726873649","https://openalex.org/W6732742072","https://openalex.org/W6732958910","https://openalex.org/W6739901393","https://openalex.org/W6747225742","https://openalex.org/W6755207826","https://openalex.org/W6756040250"],"related_works":["https://openalex.org/W2063218608","https://openalex.org/W4386105885","https://openalex.org/W2312145515","https://openalex.org/W2184288218","https://openalex.org/W2947282851","https://openalex.org/W2374066281","https://openalex.org/W4387423606","https://openalex.org/W2071180033","https://openalex.org/W2036058638","https://openalex.org/W2528082075"],"abstract_inverted_index":{"Image-text":[0],"retrieval":[1,14,61,136],"aims":[2],"to":[3,32,59,87],"capture":[4,33],"the":[5,34,52,112,135],"semantic":[6],"correlation":[7],"between":[8,37,47],"images":[9,38],"and":[10,24,39,49,91],"texts.":[11,40],"Existing":[12],"image-text":[13,79],"methods":[15],"can":[16],"be":[17],"roughly":[18],"categorized":[19],"into":[20],"embedding":[21,94,127],"learning":[22,26,95],"paradigm":[23,30,43],"pair-wise":[25,56],"paradigm.":[27,96],"The":[28,41],"former":[29],"fails":[31],"fine-grained":[35,45,89],"correspondence":[36],"latter":[42],"achieves":[44],"alignment":[46,90],"regions":[48],"words,":[50],"but":[51,132],"high":[53],"cost":[54],"of":[55],"computation":[57],"leads":[58],"slow":[60],"speed.":[62],"In":[63,118],"this":[64,119],"paper,":[65],"we":[66,98],"propose":[67],"a":[68],"novel":[69],"method":[70],"named":[71],"MEMBER":[72,143],"by":[73],"using":[74],"Memory-based":[75],"EMBedding":[76],"Enhancement":[77],"for":[78],"Retrieval":[80],"(MEMBER),":[81],"which":[82],"introduces":[83],"global":[84],"memory":[85,116],"banks":[86],"enable":[88],"fusion":[92],"in":[93,111],"Specifically,":[97],"enrich":[99],"image":[100],"(resp.,":[101,107,114],"text)":[102],"features":[103,109],"with":[104],"relevant":[105],"text":[106,113],"image)":[108,115],"stored":[110],"bank.":[117],"way,":[120],"our":[121,142],"model":[122],"not":[123],"only":[124],"accomplishes":[125],"mutual":[126],"enhancement":[128],"across":[129],"two":[130,149],"modalities,":[131],"also":[133],"maintains":[134],"efficiency.":[137],"Extensive":[138],"experiments":[139],"demonstrate":[140],"that":[141],"remarkably":[144],"outperforms":[145],"state-of-the-art":[146],"approaches":[147],"on":[148],"large-scale":[150],"benchmark":[151],"datasets.":[152]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":18},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":7}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
