{"id":"https://openalex.org/W7155086535","doi":"https://doi.org/10.48550/arxiv.2604.18027","title":"CodePivot: Bootstrapping Multilingual Transpilation in LLMs via Reinforcement Learning without Parallel Corpora","display_name":"CodePivot: Bootstrapping Multilingual Transpilation in LLMs via Reinforcement Learning without Parallel Corpora","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W7155086535","doi":"https://doi.org/10.48550/arxiv.2604.18027"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18027","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18027","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18027","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113364867","display_name":"Shangyu Li","orcid":"https://orcid.org/0000-0003-1426-9206"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134207130","display_name":"Juyong Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Juyong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134162301","display_name":"Meibo Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Meibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134116878","display_name":"Sizhe Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Sizhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128280187","display_name":"Huiri TAN","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tan, Huiri","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070721407","display_name":"Yunhao Gou","orcid":"https://orcid.org/0000-0002-1352-794X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gou, Yunhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134151980","display_name":"Xu Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024635381","display_name":"Chun Yong Chong","orcid":"https://orcid.org/0000-0003-1164-0049"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chong, Chun Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134146041","display_name":"Yun Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Yun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5024117197","display_name":"Jiasi Shen","orcid":"https://orcid.org/0000-0002-5904-3641"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Jiasi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3066999912261963,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3066999912261963,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.18050000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.06650000065565109,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6310999989509583},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.6093999743461609},{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.4916999936103821},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.46959999203681946},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.3864000141620636},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.36250001192092896},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.357699990272522}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8442000150680542},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6310999989509583},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.609499990940094},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.6093999743461609},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.54830002784729},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.4916999936103821},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48570001125335693},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.46959999203681946},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.3864000141620636},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.357699990272522},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.3562000095844269},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.34439998865127563},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.32589998841285706},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.28279998898506165},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.25450000166893005}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18027","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18027","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18027","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18027","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Transpilation,":[0],"or":[1],"code":[2,8,45,234],"translation,":[3],"aims":[4],"to":[5,14,28,62,98,114,158],"convert":[6],"source":[7],"from":[9,23,67,124],"one":[10],"programming":[11],"language":[12,36],"(PL)":[13],"another.":[15],"It":[16,194],"is":[17,77,107],"beneficial":[18],"for":[19,31,44,110],"many":[20],"downstream":[21],"applications,":[22],"modernizing":[24],"large":[25,35],"legacy":[26],"codebases":[27],"augmenting":[29],"data":[30,236],"low-resource":[32,83,111,190],"PLs.":[33,84,104],"Recent":[34],"model":[37],"(LLM)-based":[38],"approaches":[39,88],"have":[40],"demonstrated":[41],"immense":[42],"potential":[43],"translation.":[46],"Among":[47],"these":[48,121,133],"approaches,":[49],"training-based":[50,87],"methods":[51,122],"are":[52,237],"particularly":[53,108],"important":[54],"because":[55],"LLMs":[56],"currently":[57],"do":[58],"not":[59],"effectively":[60],"adapt":[61],"domain-specific":[63],"settings":[64],"that":[65,141,174],"suffer":[66,123],"a":[68,91,100,115,138,151],"lack":[69],"of":[70,103,117,202],"knowledge":[71],"without":[72,165],"targeted":[73],"training.":[74],"This":[75,105],"limitation":[76,106],"evident":[78],"in":[79],"transpilation":[80,93,163,192,231],"tasks":[81,213,228],"involving":[82,170],"However,":[85],"existing":[86],"rely":[89],"on":[90,180,211,226,229],"pairwise":[92],"paradigm,":[94],"making":[95],"it":[96,220],"impractical":[97],"support":[99],"diverse":[101],"range":[102],"prominent":[109],"PLs":[112,172],"due":[113],"scarcity":[116],"training":[118,139],"data.":[119],"Furthermore,":[120],"suboptimal":[125],"reinforcement":[126],"learning":[127],"(RL)":[128],"reward":[129,154],"formulations.":[130],"To":[131],"address":[132],"limitations,":[134],"we":[135],"propose":[136],"CodePivot,":[137],"framework":[140],"leverages":[142],"Python":[143],"as":[144,207],"an":[145],"intermediate":[146],"representation":[147],"(IR),":[148],"augmented":[149],"by":[150],"novel":[152],"RL":[153],"mechanism,":[155],"Aggressive-Partial-Functional":[156],"reward,":[157],"bootstrap":[159],"the":[160,175],"model's":[161],"multilingual":[162],"ability":[164],"requiring":[166],"parallel":[167],"corpora.":[168],"Experiments":[169],"10":[171],"show":[173],"resulting":[176],"7B":[177],"model,":[178],"trained":[179,224],"Python-to-Others":[181,212],"tasks,":[182,216],"consistently":[183],"improves":[184],"performance":[185],"across":[186],"both":[187],"general":[188,230],"and":[189,209,214,235],"PL-related":[191],"tasks.":[193,232],"outperforms":[195,221],"substantially":[196],"larger":[197],"mainstream":[198],"models":[199],"with":[200],"hundreds":[201],"billions":[203],"more":[204],"parameters,":[205],"such":[206],"Deepseek-R1":[208],"Qwen3-235B-A22B-Instruct-2507,":[210],"Others-to-All":[215],"respectively.":[217],"In":[218],"addition,":[219],"its":[222],"counterpart":[223],"directly":[225],"Any-to-Any":[227],"The":[233],"available":[238],"at":[239],"https://github.com/lishangyu-hkust/CodePivot.":[240]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-22T00:00:00"}
