{"id":"https://openalex.org/W7125530491","doi":"https://doi.org/10.48550/arxiv.2601.15337","title":"Language Models Entangle Language and Culture","display_name":"Language Models Entangle Language and Culture","publication_year":2026,"publication_date":"2026-01-20","ids":{"openalex":"https://openalex.org/W7125530491","doi":"https://doi.org/10.48550/arxiv.2601.15337"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.15337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.15337","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109465151","display_name":"Shourya Jain","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jain, Shourya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123504887","display_name":"Paras Chopra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chopra, Paras","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5109465151"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.6370000243186951,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.6370000243186951,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.07580000162124634,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.031599998474121094,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6794999837875366},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.598800003528595},{"id":"https://openalex.org/keywords/disadvantaged","display_name":"Disadvantaged","score":0.5950000286102295},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5493000149726868},{"id":"https://openalex.org/keywords/on-language","display_name":"On Language","score":0.439300000667572},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.41600000858306885},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3409000039100647}],"concepts":[{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6794999837875366},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.598800003528595},{"id":"https://openalex.org/C2780623907","wikidata":"https://www.wikidata.org/wiki/Q106394435","display_name":"Disadvantaged","level":2,"score":0.5950000286102295},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5493000149726868},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5142999887466431},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4959999918937683},{"id":"https://openalex.org/C2779313563","wikidata":"https://www.wikidata.org/wiki/Q17072565","display_name":"On Language","level":2,"score":0.439300000667572},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40380001068115234},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3409000039100647},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.33820000290870667},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.33070001006126404},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2937999963760376},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.27570000290870667},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2703999876976013},{"id":"https://openalex.org/C2777673361","wikidata":"https://www.wikidata.org/wiki/Q5281228","display_name":"Disadvantage","level":2,"score":0.26570001244544983},{"id":"https://openalex.org/C83479923","wikidata":"https://www.wikidata.org/wiki/Q2063748","display_name":"Universal Networking Language","level":4,"score":0.26409998536109924},{"id":"https://openalex.org/C125209646","wikidata":"https://www.wikidata.org/wiki/Q1338878","display_name":"Cultural diversity","level":2,"score":0.2583000063896179},{"id":"https://openalex.org/C1813318","wikidata":"https://www.wikidata.org/wiki/Q2465887","display_name":"Language industry","level":4,"score":0.2533999979496002},{"id":"https://openalex.org/C2778883600","wikidata":"https://www.wikidata.org/wiki/Q2390977","display_name":"Language proficiency","level":2,"score":0.25209999084472656}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.15337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.15337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.15337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8330137729644775}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Users":[0],"should":[1,19],"not":[2],"be":[3],"systemically":[4],"disadvantaged":[5],"by":[6,56,97,153],"the":[7,45,64,69,88,95,102,120,149,154,161,164],"language":[8,27,65,75,86,146],"they":[9],"use":[10,49],"for":[11],"interacting":[12],"with":[13],"LLMs;":[14],"i.e.":[15],"users":[16],"across":[17,123],"languages":[18],"get":[20],"responses":[21,54],"of":[22,26,36,44,85,119,163],"similar":[23],"quality":[24,61,134,162],"irrespective":[25],"used.":[28],"In":[29],"this":[30],"work,":[31],"we":[32,112],"create":[33],"a":[34,116],"set":[35],"real-world":[37],"open-ended":[38,137],"questions":[39,138],"based":[40],"on":[41,63,115],"our":[42],"analysis":[43],"WildChat":[46],"dataset":[47],"and":[48,76,91],"it":[50],"to":[51,67,100,136],"evaluate":[52,113],"whether":[53,59],"vary":[55],"language,":[57],"specifically,":[58],"answer":[60],"depends":[62],"used":[66,93,152],"query":[68],"model.":[70,155],"We":[71,143],"also":[72],"investigate":[73,110],"how":[74],"culture":[77],"are":[78],"entangled":[79],"in":[80,94,106,139,158],"LLMs":[81,114,130],"such":[82],"that":[83,129,145],"choice":[84],"changes":[87],"cultural":[89,103,150],"information":[90],"context":[92,104,151,159],"response":[96],"using":[98],"LLM-as-a-Judge":[99],"identify":[101],"present":[105],"responses.":[107],"To":[108],"further":[109],"this,":[111],"translated":[117],"subset":[118],"CulturalBench":[121],"benchmark":[122],"multiple":[124],"languages.":[125,142],"Our":[126],"evaluations":[127],"reveal":[128],"consistently":[131],"provide":[132],"lower":[133],"answers":[135],"low":[140],"resource":[141],"find":[144],"significantly":[147],"impacts":[148,160],"This":[156],"difference":[157],"downstream":[165],"answer.":[166]},"counts_by_year":[],"updated_date":"2026-01-24T23:27:35.965710","created_date":"2026-01-24T00:00:00"}
