{"id":"https://openalex.org/W7155177803","doi":"https://doi.org/10.48550/arxiv.2604.19144","title":"ReflectMT: Internalizing Reflection for Efficient and High-Quality Machine Translation","display_name":"ReflectMT: Internalizing Reflection for Efficient and High-Quality Machine Translation","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155177803","doi":"https://doi.org/10.48550/arxiv.2604.19144"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19144","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19144","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19144","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125100224","display_name":"Kunquan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Kunquan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134233146","display_name":"Yingxue Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yingxue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134279799","display_name":"Fandong Meng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meng, Fandong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134316668","display_name":"Jinsong Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Jinsong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.36559998989105225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.36559998989105225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3564999997615814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.035100001841783524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7401999831199646},{"id":"https://openalex.org/keywords/reflection","display_name":"Reflection (computer programming)","score":0.6883000135421753},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5680000185966492},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5250999927520752},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.5048999786376953},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4097999930381775},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4072999954223633}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7401999831199646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7347999811172485},{"id":"https://openalex.org/C65682993","wikidata":"https://www.wikidata.org/wiki/Q1056451","display_name":"Reflection (computer programming)","level":2,"score":0.6883000135421753},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6141999959945679},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5680000185966492},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5250999927520752},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.5048999786376953},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46129998564720154},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4097999930381775},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.40459999442100525},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3817000091075897},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.3714999854564667},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.31369999051094055},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C98199350","wikidata":"https://www.wikidata.org/wiki/Q978442","display_name":"Dynamic and formal equivalence","level":3,"score":0.2597000002861023},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19144","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19144","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19144","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19144","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"years":[1],"have":[2],"witnessed":[3],"growing":[4],"interest":[5],"in":[6,112,151,162],"applying":[7],"Large":[8],"Reasoning":[9],"Models":[10],"(LRMs)":[11],"to":[12,98],"Machine":[13],"Translation":[14],"(MT).":[15],"Existing":[16],"approaches":[17],"predominantly":[18],"adopt":[19],"a":[20,45,55,106,113,159],"\"think-first-then-translate\"":[21],"paradigm.":[22,57],"Although":[23],"explicit":[24,126],"reasoning":[25,127,146],"trajectories":[26],"significantly":[27],"enhance":[28],"translation":[29,52,115,164],"quality,":[30],"they":[31],"incur":[32],"prohibitive":[33],"inference":[34,143],"costs":[35],"and":[36,80,87,155],"latency.":[37],"To":[38],"address":[39],"these":[40],"limitations,":[41],"we":[42,72,94],"propose":[43],"ReflectMT,":[44],"two-stage":[46],"reflection":[47,79],"internalization":[48],"algorithm":[49],"for":[50,77],"machine":[51],"that":[53,137],"employs":[54],"\"translate-first-think-later\"":[56],"Our":[58],"approach":[59],"develops":[60],"the":[61,69,74,91,96,100,121],"model's":[62,75,139],"\"translate-reflect-refine\"":[63],"capability":[64],"through":[65],"reinforcement":[66],"learning.":[67],"In":[68,90],"first":[70,122],"stage,":[71,93],"cultivate":[73],"capacity":[76],"high-quality":[78,118],"refinement,":[81],"thereby":[82],"enhancing":[83],"its":[84],"semantic":[85],"comprehension":[86],"task-specific":[88],"knowledge.":[89],"second":[92],"train":[95],"model":[97],"internalize":[99],"knowledge":[101],"acquired":[102],"during":[103,108,142],"reflection.":[104],"As":[105],"result,":[107],"inference,":[109],"ReflectMT":[110],"operates":[111],"direct":[114],"mode,":[116],"producing":[117],"translations":[119,141],"on":[120,131],"attempt":[123],"without":[124],"any":[125],"steps.":[128],"Experimental":[129],"results":[130],"datasets":[132],"such":[133,148],"as":[134,149],"WMT24":[135],"demonstrate":[136],"our":[138],"first-pass":[140],"outperform":[144],"multi-step":[145],"LRMs":[147],"DeepSeek-R1":[150],"both":[152],"automatic":[153],"metrics":[154],"GPT-based":[156,163],"evaluation,":[157],"achieving":[158],"2.16-point":[160],"improvement":[161],"quality":[165],"evaluation":[166],"while":[167],"reducing":[168],"token":[169],"consumption":[170],"by":[171],"94.33%.":[172]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
