{"id":"https://openalex.org/W7123501894","doi":"https://doi.org/10.48550/arxiv.2601.06307","title":"A Rising Tide Lifts All Boats: MTQE Rewards for Idioms Improve General Translation Quality","display_name":"A Rising Tide Lifts All Boats: MTQE Rewards for Idioms Improve General Translation Quality","publication_year":2026,"publication_date":"2026-01-09","ids":{"openalex":"https://openalex.org/W7123501894","doi":"https://doi.org/10.48550/arxiv.2601.06307"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.06307","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.06307","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.06307","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5099230662","display_name":"Ishika Agarwal","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Agarwal, Ishika","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122924349","display_name":"Zhenlin He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Zhenlin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022983948","display_name":"Dhruva Patil","orcid":"https://orcid.org/0000-0001-6045-4977"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patil, Dhruva","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5122936747","display_name":"Dilek Hakkani-T\u00fcr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hakkani-T\u00fcr, Dilek","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5099230662"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.28130000829696655,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.28130000829696655,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.25049999356269836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.03550000116229057,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/literal-translation","display_name":"Literal translation","score":0.7531999945640564},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7275999784469604},{"id":"https://openalex.org/keywords/literal-and-figurative-language","display_name":"Literal and figurative language","score":0.699999988079071},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.6237000226974487},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5965999960899353},{"id":"https://openalex.org/keywords/literal","display_name":"Literal (mathematical logic)","score":0.45249998569488525},{"id":"https://openalex.org/keywords/example-based-machine-translation","display_name":"Example-based machine translation","score":0.4440000057220459},{"id":"https://openalex.org/keywords/machine-translation-software-usability","display_name":"Machine translation software usability","score":0.4244000017642975}],"concepts":[{"id":"https://openalex.org/C2777761643","wikidata":"https://www.wikidata.org/wiki/Q1191837","display_name":"Literal translation","level":3,"score":0.7531999945640564},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7275999784469604},{"id":"https://openalex.org/C46182478","wikidata":"https://www.wikidata.org/wiki/Q7363315","display_name":"Literal and figurative language","level":2,"score":0.699999988079071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6664999723434448},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6503000259399414},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.6237000226974487},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6096000075340271},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5965999960899353},{"id":"https://openalex.org/C2780882242","wikidata":"https://www.wikidata.org/wiki/Q14235582","display_name":"Literal (mathematical logic)","level":2,"score":0.45249998569488525},{"id":"https://openalex.org/C24687705","wikidata":"https://www.wikidata.org/wiki/Q3753284","display_name":"Example-based machine translation","level":3,"score":0.4440000057220459},{"id":"https://openalex.org/C148526163","wikidata":"https://www.wikidata.org/wiki/Q6723733","display_name":"Machine translation software usability","level":4,"score":0.4244000017642975},{"id":"https://openalex.org/C519982507","wikidata":"https://www.wikidata.org/wiki/Q1568","display_name":"Hindi","level":2,"score":0.38119998574256897},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.3619999885559082},{"id":"https://openalex.org/C110046852","wikidata":"https://www.wikidata.org/wiki/Q468495","display_name":"Computer-assisted translation","level":3,"score":0.34040001034736633},{"id":"https://openalex.org/C2986862884","wikidata":"https://www.wikidata.org/wiki/Q7553","display_name":"Language translation","level":3,"score":0.33899998664855957},{"id":"https://openalex.org/C98199350","wikidata":"https://www.wikidata.org/wiki/Q978442","display_name":"Dynamic and formal equivalence","level":3,"score":0.32760000228881836},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.32100000977516174},{"id":"https://openalex.org/C51802942","wikidata":"https://www.wikidata.org/wiki/Q7662211","display_name":"Synchronous context-free grammar","level":4,"score":0.30309998989105225},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2734000086784363},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C135784402","wikidata":"https://www.wikidata.org/wiki/Q6958279","display_name":"Evaluation of machine translation","level":5,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.06307","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.06307","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.06307","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.06307","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8209361433982849,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Non-compositional":[0],"expressions":[1,26],"(e.g.,":[2],"idioms,":[3],"proverbs,":[4],"and":[5,31,35,74,96,119,128],"metaphors)":[6],"pose":[7],"significant":[8],"challenges":[9],"for":[10,122],"neural":[11],"machine":[12],"translation":[13,40,82,90,98,117],"systems":[14],"because":[15],"their":[16],"meanings":[17],"cannot":[18],"be":[19],"derived":[20],"from":[21],"individual":[22],"words":[23],"alone.":[24],"These":[25],"encode":[27],"rich,":[28],"cultural":[29],"meaning,":[30],"have":[32],"both":[33],"figurative":[34,129],"literal":[36],"meanings,":[37],"making":[38],"accurate":[39],"difficult.":[41],"Because":[42],"models":[43,61,67],"are":[44],"fairly":[45],"good":[46],"at":[47],"translating":[48],"compositional":[49],"text,":[50],"we":[51,78],"investigate":[52],"GRPO-style":[53],"fine-tuning":[54],"using":[55],"Machine":[56],"Translation":[57],"Quality":[58],"Estimation":[59],"(MTQE)":[60],"as":[62],"reward":[63],"functions":[64],"to":[65,68],"train":[66],"better":[69],"translate":[70],"idioms.":[71],"Using":[72],"Chinese":[73],"Hindi":[75],"idiom":[76,81],"datasets,":[77],"find":[79],"that":[80],"abilities":[83,99],"improve":[84],"by":[85,93,108],"~14":[86],"points,":[87,95],"general,":[88],"non-idiomatic":[89],"implicitly":[91],"improves":[92,107],"~8":[94],"cross-lingual":[97],"(trained":[100],"on":[101,105],"one":[102],"language,":[103],"evaluated":[104],"another)":[106],"~6":[109],"points.":[110],"Overall,":[111],"our":[112],"work":[113],"quantifies":[114],"the":[115],"non-compositional":[116],"gap":[118],"offers":[120],"insights":[121],"developing":[123],"LLMs":[124],"with":[125],"stronger":[126],"cross-cultural":[127],"language":[130],"understanding.":[131]},"counts_by_year":[],"updated_date":"2026-01-14T23:44:37.837170","created_date":"2026-01-14T00:00:00"}
