{"id":"https://openalex.org/W4406115634","doi":"https://doi.org/10.1145/3704323.3704346","title":"Enhancing Pretrained Multilingual Machine Translation Model with Code-Switching: A Study on Chinese, English and Malay Language","display_name":"Enhancing Pretrained Multilingual Machine Translation Model with Code-Switching: A Study on Chinese, English and Malay Language","publication_year":2024,"publication_date":"2024-10-25","ids":{"openalex":"https://openalex.org/W4406115634","doi":"https://doi.org/10.1145/3704323.3704346"},"language":"en","primary_location":{"id":"doi:10.1145/3704323.3704346","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3704323.3704346","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 13th International Conference on Computing and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3704323.3704346","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004929949","display_name":"Haijing Liu","orcid":"https://orcid.org/0009-0000-4772-9569"},"institutions":[{"id":"https://openalex.org/I4210138650","display_name":"Universiti Teknologi MARA System","ror":"https://ror.org/030847t23","country_code":"MY","type":"education","lineage":["https://openalex.org/I4210138650"]},{"id":"https://openalex.org/I4210115395","display_name":"Taiyuan Institute of Technology","ror":"https://ror.org/02d0fkx94","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210115395"]}],"countries":["CN","MY"],"is_corresponding":true,"raw_author_name":"Haijing Liu","raw_affiliation_strings":["College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia, and","Department of Computer Engineering, Taiyuan Institute of Technology, Taiyuan, Shanxi, China","College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia,"],"affiliations":[{"raw_affiliation_string":"College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia, and","institution_ids":["https://openalex.org/I4210138650"]},{"raw_affiliation_string":"Department of Computer Engineering, Taiyuan Institute of Technology, Taiyuan, Shanxi, China","institution_ids":["https://openalex.org/I4210115395"]},{"raw_affiliation_string":"College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia,","institution_ids":["https://openalex.org/I4210138650"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078214061","display_name":"Noraini Seman","orcid":"https://orcid.org/0000-0002-0661-4607"},"institutions":[{"id":"https://openalex.org/I4210138650","display_name":"Universiti Teknologi MARA System","ror":"https://ror.org/030847t23","country_code":"MY","type":"education","lineage":["https://openalex.org/I4210138650"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Noraini Seman","raw_affiliation_strings":["College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia"],"affiliations":[{"raw_affiliation_string":"College of Computing, Informatics and Mathematics, University Technology MARA, Shah Alam, Selangor, Malaysia","institution_ids":["https://openalex.org/I4210138650"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5004929949"],"corresponding_institution_ids":["https://openalex.org/I4210115395","https://openalex.org/I4210138650"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.70551449,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"388","last_page":"393"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9726999998092651,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/malay","display_name":"Malay","score":0.955558717250824},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8490651249885559},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7577791213989258},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6625216603279114},{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.6074857711791992},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5671690702438354},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4994673728942871},{"id":"https://openalex.org/keywords/language-translation","display_name":"Language translation","score":0.48702579736709595},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.48631271719932556},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.4365995228290558},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.36810439825057983}],"concepts":[{"id":"https://openalex.org/C2776938241","wikidata":"https://www.wikidata.org/wiki/Q9237","display_name":"Malay","level":2,"score":0.955558717250824},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8490651249885559},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7577791213989258},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6625216603279114},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.6074857711791992},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5671690702438354},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4994673728942871},{"id":"https://openalex.org/C2986862884","wikidata":"https://www.wikidata.org/wiki/Q7553","display_name":"Language translation","level":3,"score":0.48702579736709595},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.48631271719932556},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.4365995228290558},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.36810439825057983},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3704323.3704346","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3704323.3704346","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 13th International Conference on Computing and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3704323.3704346","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3704323.3704346","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 13th International Conference on Computing and Pattern Recognition","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4099999964237213,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2756566411","https://openalex.org/W2896457183","https://openalex.org/W2933138175","https://openalex.org/W2936627440","https://openalex.org/W2954089321","https://openalex.org/W2970397112","https://openalex.org/W2997518171","https://openalex.org/W3001434439","https://openalex.org/W3034724424","https://openalex.org/W3035390927","https://openalex.org/W3090350559","https://openalex.org/W3169369929","https://openalex.org/W3200578235","https://openalex.org/W4206908526","https://openalex.org/W4285077564","https://openalex.org/W4299579390","https://openalex.org/W4385571785","https://openalex.org/W4390092938","https://openalex.org/W6739901393","https://openalex.org/W6744957266"],"related_works":["https://openalex.org/W2883671469","https://openalex.org/W2728761353","https://openalex.org/W2000013842","https://openalex.org/W4362495644","https://openalex.org/W2134714056","https://openalex.org/W4321065355","https://openalex.org/W2997015083","https://openalex.org/W3127743011","https://openalex.org/W2892009878","https://openalex.org/W2974285821"],"abstract_inverted_index":{"In":[0,84],"the":[1,13,17,50,64,69,74,82,88,97,104,130,135,140,143,148,160],"field":[2],"of":[3,52,73,81,92,106,114,154],"multilingual":[4,42,61],"machine":[5,43,56],"translation,":[6],"many":[7],"pretrained":[8,21,41],"language":[9],"models":[10,22],"have":[11],"achieved":[12],"inspiring":[14],"results.":[15],"However,":[16],"results":[18,105,141,161],"based":[19],"on":[20,87,110],"are":[23],"not":[24],"yet":[25],"very":[26],"satisfactory":[27],"for":[28],"low-resource":[29],"languages.":[30],"This":[31,121],"paper":[32,122],"investigates":[33],"how":[34],"to":[35,39,48,102,128,156],"leverage":[36],"code-switching":[37,65,98,144],"data":[38,99,131],"fine-tune":[40],"translation":[44],"model,":[45],"in":[46,132],"order":[47],"boost":[49],"performance":[51],"few-shot":[53],"low":[54],"resource":[55],"translation.":[57],"By":[58],"utilizing":[59],"a":[60],"mixed":[62],"corpus,":[63],"method":[66,101],"can":[67],"enhance":[68],"cross-linguistic":[70],"generalization":[71],"ability":[72],"model":[75,91,109,146],"and":[76,119,134],"improve":[77,147],"its":[78],"overall":[79],"understanding":[80],"language.":[83],"this":[85],"paper,":[86],"smaller":[89],"size":[90],"FLORES-101":[93],"benchmark,":[94],"we":[95],"use":[96],"augmentation":[100],"achieve":[103],"benchmark's":[107],"larger":[108],"six":[111],"direction":[112],"pairs":[113],"three":[115],"languages,":[116],"Chinese,":[117],"English":[118],"Malay.":[120],"studied":[123],"various":[124],"corpus":[125],"mixture":[126],"mechanisms":[127],"construct":[129],"code-switching,":[133],"experimental":[136],"findings":[137],"show":[138],"that":[139],"using":[142],"fine-tuning":[145],"spBLEU":[149],"score":[150],"by":[151],"an":[152],"average":[153],"2":[155],"3":[157],"points":[158],"over":[159],"without":[162],"code-switching.":[163]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
