{"id":"https://openalex.org/W4400104719","doi":"https://doi.org/10.1145/3637528.3671787","title":"Improving the Consistency in Cross-Lingual Cross-Modal Retrieval with 1-to-K Contrastive Learning","display_name":"Improving the Consistency in Cross-Lingual Cross-Modal Retrieval with 1-to-K Contrastive Learning","publication_year":2024,"publication_date":"2024-08-24","ids":{"openalex":"https://openalex.org/W4400104719","doi":"https://doi.org/10.1145/3637528.3671787"},"language":"en","primary_location":{"id":"doi:10.1145/3637528.3671787","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3637528.3671787","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.18254","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043077962","display_name":"Zhijie Nie","orcid":"https://orcid.org/0009-0004-3933-0522"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhijie Nie","raw_affiliation_strings":["CCSE, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-3933-0522","affiliations":[{"raw_affiliation_string":"CCSE, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027015677","display_name":"Richong Zhang","orcid":"https://orcid.org/0000-0002-1207-0300"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Richong Zhang","raw_affiliation_strings":["CCSE, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1207-0300","affiliations":[{"raw_affiliation_string":"CCSE, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071268429","display_name":"Zhangchi Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhangchi Feng","raw_affiliation_strings":["CCSE, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-2673-3784","affiliations":[{"raw_affiliation_string":"CCSE, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031578713","display_name":"Hailang Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hailang Huang","raw_affiliation_strings":["CCSE, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0009-3382-435X","affiliations":[{"raw_affiliation_string":"CCSE, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5104561219","display_name":"Xudong Liu","orcid":"https://orcid.org/0009-0007-8865-3055"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xudong Liu","raw_affiliation_strings":["CCSE, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0007-8865-3055","affiliations":[{"raw_affiliation_string":"CCSE, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5043077962"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":0.9523,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.75449219,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2272","last_page":"2283"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7451278567314148},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6173240542411804},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5648599863052368},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5518341064453125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5197581648826599},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.48370224237442017},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.4415622353553772},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43743905425071716},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4108165502548218},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3707091808319092},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15415465831756592},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09666687250137329}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7451278567314148},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6173240542411804},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5648599863052368},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5518341064453125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5197581648826599},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.48370224237442017},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.4415622353553772},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43743905425071716},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4108165502548218},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3707091808319092},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15415465831756592},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09666687250137329},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3637528.3671787","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3637528.3671787","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2406.18254","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.18254","pdf_url":"https://arxiv.org/pdf/2406.18254","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.18254","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.18254","pdf_url":"https://arxiv.org/pdf/2406.18254","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.800000011920929}],"awards":[{"id":"https://openalex.org/G1421742111","display_name":null,"funder_award_id":"U23B2056","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4400104719.pdf","grobid_xml":"https://content.openalex.org/works/W4400104719.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1905882502","https://openalex.org/W2185175083","https://openalex.org/W2187089797","https://openalex.org/W2277195237","https://openalex.org/W2963527096","https://openalex.org/W2963778889","https://openalex.org/W3035390927","https://openalex.org/W3086105743","https://openalex.org/W3090449556","https://openalex.org/W3101864923","https://openalex.org/W3108655343","https://openalex.org/W3138516171","https://openalex.org/W3156636935","https://openalex.org/W3156892778","https://openalex.org/W3171975879","https://openalex.org/W3174010726","https://openalex.org/W3177654849","https://openalex.org/W3202415077","https://openalex.org/W3208314443","https://openalex.org/W4287326757","https://openalex.org/W4293567540","https://openalex.org/W4383877072","https://openalex.org/W6781120326"],"related_works":["https://openalex.org/W2118758177","https://openalex.org/W4330338194","https://openalex.org/W2153520307","https://openalex.org/W2151459719","https://openalex.org/W623261610","https://openalex.org/W2316630966","https://openalex.org/W3133744317","https://openalex.org/W2358294942","https://openalex.org/W2135622761","https://openalex.org/W4367460280"],"abstract_inverted_index":{"Cross-lingual":[0],"Cross-modal":[1],"Retrieval":[2],"(CCR)":[3],"is":[4],"an":[5],"essential":[6],"task":[7],"in":[8,26,71,83,97,103,120],"web":[9],"search,":[10],"which":[11,128,148],"aims":[12],"to":[13,78,172],"break":[14],"the":[15,27,48,67,72,92,104,114,174,203],"barriers":[16],"between":[17],"modality":[18],"and":[19,22,153,157,196],"language":[20,151],"simultaneously":[21],"achieves":[23],"image-text":[24],"retrieval":[25,60],"multi-lingual":[28],"scenario":[29],"with":[30,87,109,198],"a":[31,140,164],"single":[32],"model.":[33],"In":[34,160],"recent":[35],"years,":[36],"excellent":[37],"progress":[38],"has":[39],"been":[40],"made":[41],"based":[42,50],"on":[43,51,54,184],"cross-lingual":[44,73,88],"cross-modal":[45,75,110],"pre-training;":[46],"particularly,":[47],"methods":[49,64,70,86,108],"contrastive":[52,145],"learning":[53,146],"large-scale":[55],"data":[56],"have":[57],"significantly":[58],"improved":[59],"tasks.":[61],"However,":[62],"these":[63,136],"directly":[65],"follow":[66],"existing":[68],"pre-training":[69],"or":[74],"domain,":[76],"leading":[77],"two":[79],"problems":[80],"of":[81],"inconsistency":[82,176],"CCR:":[84],"The":[85,107],"style":[89,111],"suffer":[90,112],"from":[91,113],"intra-modal":[93],"error":[94,155],"propagation,":[95],"resulting":[96,119],"inconsistent":[98,121],"recall":[99,194],"performance":[100],"across":[101,123,177],"languages":[102,124,178],"whole":[105],"dataset.":[106],"inter-modal":[115],"optimization":[116,158],"direction":[117],"bias,":[118],"rank":[122,175],"within":[125,179],"each":[126,150,180],"instance,":[127],"cannot":[129],"be":[130],"reflected":[131],"by":[132],"Recall@K.":[133],"To":[134],"solve":[135],"problems,":[137],"we":[138,162],"propose":[139,163],"simple":[141],"but":[142],"effective":[143],"1-to-K":[144],"method,":[147],"treats":[149],"equally":[152],"eliminates":[154],"propagation":[156],"bias.":[159],"addition,":[161],"new":[165,204],"evaluation":[166],"metric,":[167],"Mean":[168],"Rank":[169],"Variance":[170],"(MRV),":[171],"reflect":[173],"instance.":[181],"Extensive":[182],"experiments":[183],"four":[185],"CCR":[186],"datasets":[187],"show":[188],"that":[189],"our":[190],"method":[191],"improves":[192],"both":[193],"rates":[195],"MRV":[197],"smaller-scale":[199],"pre-trained":[200],"data,":[201],"achieving":[202],"state-of-art.":[205]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2024-06-28T00:00:00"}
