{"id":"https://openalex.org/W7130686328","doi":"https://doi.org/10.48550/arxiv.2602.16852","title":"Meenz bleibt Meenz, but Large Language Models Do Not Speak Its Dialect","display_name":"Meenz bleibt Meenz, but Large Language Models Do Not Speak Its Dialect","publication_year":2026,"publication_date":"2026-02-18","ids":{"openalex":"https://openalex.org/W7130686328","doi":"https://doi.org/10.48550/arxiv.2602.16852"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.16852","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050750082","display_name":"Minh Duc Bui","orcid":"https://orcid.org/0000-0002-0756-7136"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bui, Minh Duc","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048083543","display_name":"Manuel Mager","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mager, Manuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090551220","display_name":"Peter Herbert Kann","orcid":"https://orcid.org/0000-0002-9099-3696"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kann, Peter Herbert","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126490084","display_name":"Katharina von der Wense","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"von der Wense, Katharina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.5103999972343445,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.5103999972343445,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.21119999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.0551999993622303,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.8378000259399414},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.492900013923645},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.47589999437332153},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.4731999933719635},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4260999858379364},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.40540000796318054},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.38940000534057617}],"concepts":[{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.8378000259399414},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.65420001745224},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6324999928474426},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5898000001907349},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.5677000284194946},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.492900013923645},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.47589999437332153},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.4731999933719635},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4260999858379364},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.40540000796318054},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.38940000534057617},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.38839998841285706},{"id":"https://openalex.org/C70777604","wikidata":"https://www.wikidata.org/wiki/Q257885","display_name":"Word order","level":2,"score":0.3407999873161316},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.3359000086784363},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.33390000462532043},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.2847000062465668},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.27480000257492065},{"id":"https://openalex.org/C2780790391","wikidata":"https://www.wikidata.org/wiki/Q1149626","display_name":"Written language","level":2,"score":0.2646999955177307},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.16852","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.16852","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.16852","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.16852","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7520277500152588,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Meenzerisch,":[0,158],"the":[1,5,12,16,30,48,53,75,79,88,112,119,136,170,180,210,218,227],"dialect":[2,89,120,150],"spoken":[3],"in":[4,78,108,118,126,157,194],"German":[6,41,246],"city":[7],"of":[8,15,32,58,81,90,241],"Mainz,":[9],"is":[10,28,84,186,200],"also":[11],"traditional":[13],"language":[14,44,144],"Mainz":[17],"carnival,":[18],"a":[19,94],"yearly":[20],"celebration":[21],"well":[22],"known":[23],"throughout":[24],"Germany.":[25],"However,":[26,62],"Meenzerisch":[27],"on":[29,87,245],"verge":[31],"dying":[33],"out-a":[34],"fate":[35],"it":[36],"shares":[37],"with":[38,52,122],"many":[39],"other":[40],"dialects.":[42,61],"Natural":[43],"processing":[45],"(NLP)":[46],"has":[47,68],"potential":[49],"to":[50,134,196,217,225],"help":[51],"preservation":[54],"and":[55,60,110,179,205,238],"revival":[56],"efforts":[57,243],"languages":[59],"so":[63],"far":[64],"no":[65],"NLP":[66,82],"research":[67,77,138,242],"looked":[69],"at":[70],"Meenzerisch.":[71],"This":[72,233],"work":[73],"presents":[74],"first":[76],"field":[80],"that":[83,165,235],"explicitly":[85],"focused":[86,244],"Mainz.":[91],"We":[92,129,188],"introduce":[93],"digital":[95],"dictionary-an":[96],"NLP-ready":[97],"dataset":[98,133],"derived":[99],"from":[100,209],"an":[101,239],"existing":[102],"resource":[103],"(Schramm,":[104],"1966)-to":[105],"support":[106],"researchers":[107],"modeling":[109],"benchmarking":[111],"language.":[113],"It":[114],"contains":[115],"2,351":[116],"words":[117,156],"paired":[121],"their":[123,160],"meanings":[124],"described":[125],"Standard":[127],"German.":[128],"then":[130,189,215],"use":[131],"this":[132],"answer":[135],"following":[137],"questions:":[139],"(1)":[140],"Can":[141,153],"state-of-the-art":[142],"large":[143],"models":[145],"(LLMs)":[146],"generate":[147,155],"definitions":[148,174],"for":[149,173],"words?":[151],"(2)":[152],"LLMs":[154,166],"given":[159],"definitions?":[161],"Our":[162],"experiments":[163,193],"show":[164],"can":[167],"do":[168],"neither:":[169],"best":[171,181],"model":[172],"reaches":[175],"only":[176],"6.27%":[177],"accuracy":[178,185,199,229],"word":[182],"generation":[183],"model's":[184],"1.51%.":[187],"conduct":[190],"two":[191],"additional":[192,236],"order":[195],"see":[197],"if":[198],"improved":[201],"by":[202,206],"few-shot":[203],"learning":[204],"extracting":[207],"rules":[208],"training":[211],"set,":[212],"which":[213],"are":[214,223,248],"passed":[216],"LLM.":[219],"While":[220],"those":[221],"approaches":[222],"able":[224],"improve":[226],"results,":[228],"remains":[230],"below":[231],"10%.":[232],"highlights":[234],"resources":[237],"intensification":[240],"dialects":[247],"desperately":[249],"needed.":[250]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-21T00:00:00"}
