{"id":"https://openalex.org/W4412889389","doi":"https://doi.org/10.18653/v1/2025.acl-srw.81","title":"Controlling Language Confusion in Multilingual LLMs","display_name":"Controlling Language Confusion in Multilingual LLMs","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412889389","doi":"https://doi.org/10.18653/v1/2025.acl-srw.81"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-srw.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.81","pdf_url":"https://aclanthology.org/2025.acl-srw.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-srw.81.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101846865","display_name":"Nahyun Lee","orcid":"https://orcid.org/0000-0002-8633-5519"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Nahyun Lee","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081158951","display_name":"Yeongseo Woo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yeongseo Woo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088036513","display_name":"Hyunwoo Ko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hyunwoo Ko","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028962243","display_name":"Guijin Son","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guijin Son","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101846865"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.7163,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91490974,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1026","last_page":"1035"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10759","display_name":"Translation Studies and Practices","score":0.9628000259399414,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12881","display_name":"linguistics and terminology studies","score":0.9570000171661377,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/confusion","display_name":"Confusion","score":0.8515242338180542},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6255587339401245},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3725631833076477},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.18382585048675537},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.05743834376335144}],"concepts":[{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.8515242338180542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6255587339401245},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3725631833076477},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.18382585048675537},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.05743834376335144},{"id":"https://openalex.org/C11171543","wikidata":"https://www.wikidata.org/wiki/Q41630","display_name":"Psychoanalysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.acl-srw.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.81","pdf_url":"https://aclanthology.org/2025.acl-srw.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-srw.81","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.81","pdf_url":"https://aclanthology.org/2025.acl-srw.81.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412889389.pdf","grobid_xml":"https://content.openalex.org/works/W4412889389.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2964976023","https://openalex.org/W1982477181","https://openalex.org/W2403083015","https://openalex.org/W4285488523","https://openalex.org/W2011367623","https://openalex.org/W4408384948","https://openalex.org/W2734065904"],"abstract_inverted_index":{"Large":[0],"language":[1,6,109,131],"models":[2,69],"often":[3],"suffer":[4],"from":[5,35],"confusion,":[7],"a":[8],"phenomenon":[9],"in":[10,18,27,37,133,137],"which":[11,45,93],"responses":[12],"are":[13],"partially":[14],"or":[15],"entirely":[16],"generated":[17],"unintended":[19],"languages.This":[20],"critically":[21],"degrades":[22],"the":[23,47,79],"user":[24],"experience,":[25],"especially":[26],"low-resource":[28,138],"settings.We":[29],"hypothesize":[30],"that":[31,68,123],"this":[32,88],"issue":[33],"stems":[34],"limitations":[36],"conventional":[38],"fine-tuning":[39],"objectives,":[40],"such":[41,57,86],"as":[42,58],"supervised":[43],"learning,":[44],"optimize":[46],"likelihood":[48],"of":[49,61,81],"correct":[50],"tokens":[51],"without":[52],"explicitly":[53],"penalizing":[54],"undesired":[55],"outputs":[56],"cross-lingual":[59],"mixing.Analysis":[60],"loss":[62],"trajectories":[63],"during":[64],"pretraining":[65],"further":[66],"reveals":[67],"fail":[70],"to":[71,84,100],"distinguish":[72],"between":[73],"monolingual":[74],"and":[75],"language-mixed":[76],"texts,":[77],"highlighting":[78],"absence":[80],"inherent":[82],"pressure":[83],"avoid":[85],"confusion.In":[87],"work,":[89],"we":[90],"apply":[91],"ORPO,":[92],"adds":[94],"penalties":[95],"for":[96],"unwanted":[97],"output":[98],"styles":[99],"standard":[101],"SFT,":[102],"effectively":[103,129],"suppressing":[104],"languageconfused":[105],"generations.ORPO":[106],"maintains":[107],"strong":[108],"consistency,":[110],"even":[111],"under":[112],"high":[113],"decoding":[114],"temperatures,":[115],"while":[116],"preserving":[117],"general":[118],"QA":[119],"performance.Our":[120],"findings":[121],"suggest":[122],"incorporating":[124],"appropriate":[125],"penalty":[126],"terms":[127],"can":[128],"mitigate":[130],"confusion":[132],"multilingual":[134],"models,":[135],"particularly":[136],"scenarios.":[139]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-10-10T00:00:00"}
