{"id":"https://openalex.org/W3072820880","doi":"https://doi.org/10.1109/tcsvt.2020.3017344","title":"CMPD: Using Cross Memory Network With Pair Discrimination for Image-Text Retrieval","display_name":"CMPD: Using Cross Memory Network With Pair Discrimination for Image-Text Retrieval","publication_year":2020,"publication_date":"2020-08-17","ids":{"openalex":"https://openalex.org/W3072820880","doi":"https://doi.org/10.1109/tcsvt.2020.3017344","mag":"3072820880"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2020.3017344","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2020.3017344","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100636282","display_name":"Xin Wen","orcid":"https://orcid.org/0000-0003-1937-1875"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Wen","raw_affiliation_strings":["School of Software, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068597652","display_name":"Zhizhong Han","orcid":"https://orcid.org/0000-0001-9540-9973"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhizhong Han","raw_affiliation_strings":["University of Maryland at College Park, College Park, MD, USA"],"affiliations":[{"raw_affiliation_string":"University of Maryland at College Park, College Park, MD, USA","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101691399","display_name":"Yu-Shen Liu","orcid":"https://orcid.org/0000-0001-7305-1915"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Shen Liu","raw_affiliation_strings":["School of Software, BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100636282"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":2.2471,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.90039995,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"31","issue":"6","first_page":"2427","last_page":"2437"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7866050004959106},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6563423275947571},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6561052799224854},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5688363909721375},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5437816381454468},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5366093516349792},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5279254913330078},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5203827619552612},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.4540790021419525},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42716124653816223},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.426181435585022}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7866050004959106},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6563423275947571},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6561052799224854},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5688363909721375},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5437816381454468},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5366093516349792},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5279254913330078},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5203827619552612},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.4540790021419525},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42716124653816223},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.426181435585022},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2020.3017344","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2020.3017344","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6800000071525574,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G4158542089","display_name":null,"funder_award_id":"TC190A4DA/3","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G4233802299","display_name":null,"funder_award_id":"2019YFB1405703","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G4353192804","display_name":null,"funder_award_id":"2018YFB0505400","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G6766780905","display_name":null,"funder_award_id":"61672307","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1523385540","https://openalex.org/W1811254738","https://openalex.org/W1832693441","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W1916445035","https://openalex.org/W1949478088","https://openalex.org/W1964073652","https://openalex.org/W2005666090","https://openalex.org/W2007972815","https://openalex.org/W2013535308","https://openalex.org/W2015175493","https://openalex.org/W2070753207","https://openalex.org/W2099471712","https://openalex.org/W2100235303","https://openalex.org/W2119775030","https://openalex.org/W2138118304","https://openalex.org/W2138493131","https://openalex.org/W2144407188","https://openalex.org/W2164530430","https://openalex.org/W2184188583","https://openalex.org/W2211092169","https://openalex.org/W2287451110","https://openalex.org/W2294512729","https://openalex.org/W2549070563","https://openalex.org/W2557865186","https://openalex.org/W2564325886","https://openalex.org/W2574447816","https://openalex.org/W2588534625","https://openalex.org/W2591669147","https://openalex.org/W2604394529","https://openalex.org/W2604880013","https://openalex.org/W2605359214","https://openalex.org/W2606965845","https://openalex.org/W2733636222","https://openalex.org/W2752345995","https://openalex.org/W2765440071","https://openalex.org/W2775288145","https://openalex.org/W2790362762","https://openalex.org/W2795832645","https://openalex.org/W2889024947","https://openalex.org/W2945578092","https://openalex.org/W2962706528","https://openalex.org/W2962879692","https://openalex.org/W2963187862","https://openalex.org/W2963389687","https://openalex.org/W2963466847","https://openalex.org/W2963467339","https://openalex.org/W2964130424","https://openalex.org/W2964216321","https://openalex.org/W2964430790","https://openalex.org/W2967957126","https://openalex.org/W4295521014","https://openalex.org/W4299412574","https://openalex.org/W4320013936","https://openalex.org/W6631190155","https://openalex.org/W6631216910","https://openalex.org/W6638742206","https://openalex.org/W6639102338","https://openalex.org/W6686207219","https://openalex.org/W6697020685","https://openalex.org/W6730042849","https://openalex.org/W6732292492","https://openalex.org/W6735913928","https://openalex.org/W6735953149","https://openalex.org/W6736114314","https://openalex.org/W6746775625","https://openalex.org/W6779669310"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W4307407935","https://openalex.org/W649759291"],"abstract_inverted_index":{"Cross-modal":[0],"retrieval":[1,20],"using":[2],"deep":[3],"neural":[4],"networks":[5],"aims":[6,133],"to":[7,34,111,134,145],"retrieve":[8],"relevant":[9],"data":[10],"between":[11,66],"the":[12,30,36,43,47,67,73,93,102,113,141,159,177],"two":[13,25],"different":[14,117],"modalities.":[15,118],"The":[16],"performance":[17],"of":[18,29,108,152],"cross-modal":[19],"is":[21,59,120],"still":[22,55],"unsatisfactory":[23],"for":[24,63,87],"problems.":[26],"First,":[27,99],"most":[28],"previous":[31],"methods":[32],"failed":[33],"incorporate":[35],"common":[37,114],"knowledge":[38,115],"among":[39,116,162],"modalities":[40],"when":[41],"predicting":[42],"item":[44,153],"representations.":[45,137],"Second,":[46,138],"semantic":[48,160],"relationships":[49,161],"indicated":[50],"by":[51],"class":[52,150,167],"label":[53],"are":[54],"insufficiently":[56],"utilized,":[57],"which":[58,132,155],"an":[60],"important":[61],"clue":[62],"inferring":[64],"similarities":[65],"cross":[68,80,89,103],"modal":[69,90],"items.":[70],"To":[71],"address":[72],"above":[74],"issues,":[75],"we":[76,100,139],"propose":[77,101,140],"a":[78,106],"novel":[79],"memory":[81,104],"network":[82],"with":[83],"pair":[84,142],"discrimination":[85,143],"(CMPD)":[86],"image-text":[88,181],"retrieval,":[91],"where":[92],"main":[94],"contributions":[95],"lie":[96],"in":[97,180],"two-folds.":[98],"as":[105],"set":[107],"latent":[109],"concepts":[110],"capture":[112,158],"It":[119],"learnable":[121],"and":[122,149,166],"can":[123,156],"be":[124],"fused":[125],"into":[126],"each":[127],"modality":[128,147,164],"through":[129],"attention":[130],"mechanism,":[131],"discriminatively":[135],"predict":[136],"loss":[144],"discriminate":[146],"labels":[148,151,165],"pairs,":[154],"efficiently":[157],"these":[163],"labels.":[168],"Comprehensive":[169],"experimental":[170],"results":[171],"show":[172],"that":[173],"our":[174],"method":[175],"outperforms":[176],"state-of-the-art":[178],"approaches":[179],"retrieval.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
