{"id":"https://openalex.org/W4399418626","doi":"https://doi.org/10.1145/3652583.3658018","title":"RetrievalMMT: Retrieval-Constrained Multi-Modal Prompt Learning for Multi-Modal Machine Translation","display_name":"RetrievalMMT: Retrieval-Constrained Multi-Modal Prompt Learning for Multi-Modal Machine Translation","publication_year":2024,"publication_date":"2024-05-30","ids":{"openalex":"https://openalex.org/W4399418626","doi":"https://doi.org/10.1145/3652583.3658018"},"language":"en","primary_location":{"id":"doi:10.1145/3652583.3658018","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658018","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658018","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658018","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003748981","display_name":"Y Wang","orcid":"https://orcid.org/0009-0000-9403-2844"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yan Wang","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0009-0000-9403-2844","affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101296394","display_name":"Zeng YaWen","orcid":"https://orcid.org/0000-0003-1908-1157"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yawen Zeng","raw_affiliation_strings":["ByteDance AI Lab, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1908-1157","affiliations":[{"raw_affiliation_string":"ByteDance AI Lab, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114430015","display_name":"Junjie Liang","orcid":"https://orcid.org/0009-0006-7200-0749"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junjie Liang","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0009-0006-7200-0749","affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036301580","display_name":"Xiaofen Xing","orcid":"https://orcid.org/0000-0002-0016-9055"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaofen Xing","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-0016-9055","affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114357209","display_name":"Jin Xu","orcid":"https://orcid.org/0009-0001-8735-3532"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Xu","raw_affiliation_strings":["South China University of Technology &amp; Pazhou Lab, Guangzhou, China"],"raw_orcid":"https://orcid.org/0009-0001-8735-3532","affiliations":[{"raw_affiliation_string":"South China University of Technology &amp; Pazhou Lab, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007354180","display_name":"Xiangmin Xu","orcid":"https://orcid.org/0000-0003-4573-5820"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangmin Xu","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-4573-5820","affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5003748981"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":0.7099,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.69477422,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"860","last_page":"868"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7886366248130798},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7535594701766968},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.63539719581604},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5599462389945984},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5507763028144836},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44531798362731934},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.42397406697273254},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3766184449195862},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10419508814811707}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7886366248130798},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7535594701766968},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.63539719581604},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5599462389945984},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5507763028144836},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44531798362731934},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.42397406697273254},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3766184449195862},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10419508814811707},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3652583.3658018","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658018","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658018","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3652583.3658018","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3658018","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3658018","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2234319012","display_name":null,"funder_award_id":"62372187","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2993877962","display_name":null,"funder_award_id":"62372187","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G5261590510","display_name":null,"funder_award_id":"2021YFC2202603","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G6295744823","display_name":null,"funder_award_id":"2021YFC2202603","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399418626.pdf","grobid_xml":"https://content.openalex.org/works/W4399418626.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W2101105183","https://openalex.org/W2133512280","https://openalex.org/W2509282593","https://openalex.org/W2581101319","https://openalex.org/W2593341061","https://openalex.org/W2950207430","https://openalex.org/W2950886580","https://openalex.org/W2963909453","https://openalex.org/W3034027410","https://openalex.org/W3083614545","https://openalex.org/W3102475290","https://openalex.org/W3119746927","https://openalex.org/W3168900788","https://openalex.org/W3174570731","https://openalex.org/W3176471072","https://openalex.org/W3198377975","https://openalex.org/W4205991051","https://openalex.org/W4206119104","https://openalex.org/W4221155857","https://openalex.org/W4241499611","https://openalex.org/W4283399653","https://openalex.org/W4284688019","https://openalex.org/W4385573026","https://openalex.org/W4386799811","https://openalex.org/W6600299915"],"related_works":["https://openalex.org/W2385859805","https://openalex.org/W2530972254","https://openalex.org/W2775554247","https://openalex.org/W627697492","https://openalex.org/W2110168585","https://openalex.org/W3107474891","https://openalex.org/W2250213760","https://openalex.org/W4386247111","https://openalex.org/W4327642362","https://openalex.org/W2587014613"],"abstract_inverted_index":{"As":[0],"an":[1,32,87],"extension":[2],"of":[3,9,18,67,101,115,142],"machine":[4,11,150],"translation,":[5],"the":[6,16,45,99,111,127,140],"primary":[7],"objective":[8],"multi-modal":[10,27,79,102,128,144,149],"translation":[12,151],"is":[13,24,75],"to":[14,55,77,83,90,147],"optimize":[15],"utilization":[17],"visual":[19,61,92,112],"information.":[20],"Technically,":[21],"image":[22],"information":[23,93],"integrated":[25],"into":[26],"fusion":[28],"and":[29,64,86,134],"alignment":[30],"as":[31,131],"auxiliary":[33],"modality":[34,54],"through":[35],"concepts":[36,80],"or":[37,81],"latent":[38],"semantics,":[39],"which":[40],"are":[41,108],"typically":[42],"based":[43],"on":[44],"Transformer":[46],"framework.":[47,72],"However,":[48],"current":[49],"approaches":[50],"often":[51],"ignore":[52],"one":[53],"design":[56],"numerous":[57],"handcrafted":[58],"features":[59,82],"(e.g.":[60],"concept":[62],"extraction)":[63],"require":[65],"training":[66],"all":[68],"parameters":[69],"in":[70,126],"their":[71,119],"Therefore,":[73],"it":[74],"worthwhile":[76],"explore":[78],"enhance":[84],"performance":[85],"efficient":[88],"approach":[89],"incorporate":[91],"with":[94,98,110],"minimal":[95],"cost.":[96],"Meanwhile,":[97],"development":[100],"large":[103],"language":[104],"models":[105],"(MLLMs),":[106],"they":[107],"faced":[109],"hallucination":[113],"issue":[114],"compromising":[116],"performance,":[117],"despite":[118],"powerful":[120],"capabilities.":[121],"Inspired":[122],"by":[123],"pioneering":[124],"techniques":[125],"field,":[129],"such":[130],"prompt":[132,145],"learning":[133,146],"MLLMs,":[135],"this":[136,148],"paper":[137],"innovatively":[138],"explores":[139],"possibility":[141],"applying":[143],"task.":[152]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-10-10T00:00:00"}
