{"id":"https://openalex.org/W4414857288","doi":"https://doi.org/10.48550/arxiv.2505.24456","title":"CaMMT: Benchmarking Culturally Aware Multimodal Machine Translation","display_name":"CaMMT: Benchmarking Culturally Aware Multimodal Machine Translation","publication_year":2025,"publication_date":"2025-05-30","ids":{"openalex":"https://openalex.org/W4414857288","doi":"https://doi.org/10.48550/arxiv.2505.24456"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2505.24456","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.24456","pdf_url":"https://arxiv.org/pdf/2505.24456","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2505.24456","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095084148","display_name":"Emilio Villa-Cueva","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Villa-Cueva, Emilio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119862493","display_name":"Sholpan Bolatzhanova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bolatzhanova, Sholpan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075508196","display_name":"Diana Turmakhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Turmakhan, Diana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119862494","display_name":"Kareem Elzeky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elzeky, Kareem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099096834","display_name":"Henok Biadglign Ademtew","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ademtew, Henok Biadglign","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112924039","display_name":"Alham Fikri Aji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aji, Alham Fikri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058447624","display_name":"Vladimir Araujo","orcid":"https://orcid.org/0000-0001-5760-8410"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Araujo, Vladimir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013873474","display_name":"Israel Abebe Azime","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Azime, Israel Abebe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013449404","display_name":"Jinheon Baek","orcid":"https://orcid.org/0000-0002-9367-560X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baek, Jinheon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000223765","display_name":"Frederico Belcavello","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Belcavello, Frederico","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119862492","display_name":"Fermin Cristobal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cristobal, Fermin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048793278","display_name":"Jan Christian Blaise Cruz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cruz, Jan Christian Blaise","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114847407","display_name":"Mary Dabre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dabre, Mary","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077362985","display_name":"Raj Dabre","orcid":"https://orcid.org/0000-0003-0664-3421"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dabre, Raj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019079656","display_name":"Toqeer Ehsan","orcid":"https://orcid.org/0000-0002-6724-6705"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ehsan, Toqeer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084495633","display_name":"Naome A. Etori","orcid":"https://orcid.org/0000-0001-7772-1103"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Etori, Naome A","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093278345","display_name":"Fauzan Farooqui","orcid":"https://orcid.org/0009-0000-7939-3692"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farooqui, Fauzan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073054282","display_name":"Jiahui Geng","orcid":"https://orcid.org/0000-0002-4205-8230"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geng, Jiahui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095765182","display_name":"Guido Ivetta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ivetta, Guido","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104199197","display_name":"Thanmay Jayakumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jayakumar, Thanmay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088628107","display_name":"Soyeong Jeong","orcid":"https://orcid.org/0000-0003-3428-0365"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeong, Soyeong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043522247","display_name":"Zheng Wei Lim","orcid":"https://orcid.org/0000-0003-1307-2399"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lim, Zheng Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065667092","display_name":"Aishik Mandal","orcid":"https://orcid.org/0009-0007-1056-2110"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mandal, Aishik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Martinelli, Sofia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martinelli, Sofia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112275730","display_name":"Mihail Mihaylov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mihaylov, Mihail Minkov","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000211688","display_name":"Daniil Orel","orcid":"https://orcid.org/0009-0007-5600-7032"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Orel, Daniil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041415557","display_name":"Aniket Pramanick","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pramanick, Aniket","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090787541","display_name":"Sukannya Purkayastha","orcid":"https://orcid.org/0000-0002-7559-0522"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Purkayastha, Sukannya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065946161","display_name":"Israfel Salazar","orcid":"https://orcid.org/0000-0001-9360-0192"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Salazar, Israfel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033608663","display_name":"Haiyue Song","orcid":"https://orcid.org/0000-0003-1159-0918"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Haiyue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048013691","display_name":"Tiago Timponi Torrent","orcid":"https://orcid.org/0000-0001-5373-2297"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Torrent, Tiago Timponi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114653388","display_name":"Debela Desalegn Yadeta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yadeta, Debela Desalegn","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004299578","display_name":"Injy Hamed","orcid":"https://orcid.org/0000-0002-9171-9461"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hamed, Injy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069871289","display_name":"Atnafu Lambebo Tonja","orcid":"https://orcid.org/0000-0002-3501-5136"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tonja, Atnafu Lambebo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5047351656","display_name":"Thamar Solorio","orcid":"https://orcid.org/0000-0002-3541-9405"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Solorio, Thamar","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":35,"corresponding_author_ids":["https://openalex.org/A5095084148"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9466999769210815,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9413999915122986,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7706999778747559},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7418000102043152},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.659500002861023},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.651199996471405},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5228999853134155},{"id":"https://openalex.org/keywords/visual-language","display_name":"Visual language","score":0.35530000925064087},{"id":"https://openalex.org/keywords/language-understanding","display_name":"Language understanding","score":0.33059999346733093}],"concepts":[{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7706999778747559},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7529000043869019},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7418000102043152},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.659500002861023},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.651199996471405},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5741999745368958},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5577999949455261},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5228999853134155},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.36820000410079956},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.35530000925064087},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.33059999346733093},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.3156000077724457},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.30469998717308044},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3010999858379364},{"id":"https://openalex.org/C146047270","wikidata":"https://www.wikidata.org/wiki/Q469666","display_name":"Human\u2013machine system","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C2992975276","wikidata":"https://www.wikidata.org/wiki/Q11042","display_name":"Cultural background","level":4,"score":0.2802000045776367},{"id":"https://openalex.org/C24687705","wikidata":"https://www.wikidata.org/wiki/Q3753284","display_name":"Example-based machine translation","level":3,"score":0.27309998869895935},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2505.24456","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.24456","pdf_url":"https://arxiv.org/pdf/2505.24456","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2505.24456","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2505.24456","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2505.24456","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.24456","pdf_url":"https://arxiv.org/pdf/2505.24456","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Translating":[0],"cultural":[1,40,128],"content":[2],"poses":[3],"challenges":[4],"for":[5],"machine":[6],"translation":[7,93,121],"systems":[8,122],"due":[9],"to":[10,22,26,112,116],"the":[11],"differences":[12],"in":[13,42,61,76,96],"conceptualizations":[14],"between":[15],"cultures,":[16],"where":[17],"language":[18],"alone":[19],"may":[20],"fail":[21],"convey":[23],"sufficient":[24],"context":[25,41,90],"capture":[27],"region-specific":[28],"meanings.":[29],"In":[30],"this":[31,67],"work,":[32],"we":[33,69,86],"investigate":[34],"whether":[35],"images":[36,56],"can":[37],"act":[38],"as":[39],"multimodal":[43,120],"translation.":[44],"We":[45],"introduce":[46],"CaMMT,":[47,108],"a":[48],"human-curated":[49],"benchmark":[50],"of":[51,55],"over":[52],"5,800":[53],"triples":[54],"along":[57],"with":[58,127],"parallel":[59],"captions":[60],"English":[62],"and":[63,78,83,102,118,130],"regional":[64,131],"languages.":[65],"Using":[66],"dataset,":[68],"evaluate":[70,119],"five":[71],"Vision":[72],"Language":[73],"Models":[74],"(VLMs)":[75],"text-only":[77],"text+image":[79],"settings.":[80],"Through":[81],"automatic":[82],"human":[84],"evaluations,":[85],"find":[87],"that":[88,123],"visual":[89],"generally":[91],"improves":[92],"quality,":[94],"especially":[95],"handling":[97],"Culturally-Specific":[98],"Items":[99],"(CSIs),":[100],"disambiguation,":[101],"correct":[103],"gender":[104],"marking.":[105],"By":[106],"releasing":[107],"our":[109],"objective":[110],"is":[111],"support":[113],"broader":[114],"efforts":[115],"build":[117],"are":[124],"better":[125],"aligned":[126],"nuance":[129],"variations.":[132]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2025-10-10T00:00:00"}
