{"id":"https://openalex.org/W7128608308","doi":"https://doi.org/10.48550/arxiv.2602.09826","title":"From FusHa to Folk: Exploring Cross-Lingual Transfer in Arabic Language Models","display_name":"From FusHa to Folk: Exploring Cross-Lingual Transfer in Arabic Language Models","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128608308","doi":"https://doi.org/10.48550/arxiv.2602.09826"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.09826","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125670571","display_name":"Abdulmuizz Khalak","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Khalak, Abdulmuizz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125639017","display_name":"Abderrahmane Issam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Issam, Abderrahmane","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125683024","display_name":"Gerasimos Spanakis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spanakis, Gerasimos","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5125670571"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.2328999936580658,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.2328999936580658,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2076999992132187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.04259999841451645,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modern-standard-arabic","display_name":"Modern Standard Arabic","score":0.7437999844551086},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.7264999747276306},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.607200026512146},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.5401999950408936},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4984999895095825},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.38530001044273376}],"concepts":[{"id":"https://openalex.org/C2778243841","wikidata":"https://www.wikidata.org/wiki/Q56467","display_name":"Modern Standard Arabic","level":3,"score":0.7437999844551086},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.7264999747276306},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6984000205993652},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6504999995231628},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.607200026512146},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.5401999950408936},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5313000082969666},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.5019000172615051},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4984999895095825},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.38530001044273376},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.3384000062942505},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2921000123023987},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.2563999891281128}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.09826","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.09826","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09826","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.09826","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8139217495918274,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Arabic":[0,10,52,71,120,135],"Language":[1,78],"Models":[2],"(LMs)":[3],"are":[4,13,42],"pretrained":[5],"predominately":[6],"on":[7,75],"Modern":[8],"Standard":[9],"(MSA)":[11],"and":[12,35,82,128],"expected":[14],"to":[15,17,61,99,117],"transfer":[16,69,89,133],"its":[18,55],"dialects.":[19,121],"While":[20],"MSA":[21],"as":[22],"the":[23,45],"standard":[24],"written":[25],"variety":[26],"is":[27,90],"commonly":[28],"used":[29],"in":[30,38,58,114,134],"formal":[31],"settings,":[32],"people":[33],"speak":[34],"write":[36],"online":[37],"various":[39],"dialects":[40,56],"that":[41,88],"spread":[43],"across":[44,94],"Arab":[46],"region.":[47],"This":[48,122],"poses":[49],"limitations":[50],"for":[51,111,131],"LMs,":[53],"since":[54],"vary":[57],"their":[59,104,124],"similarity":[60],"MSA.":[62],"In":[63],"this":[64],"work":[65],"we":[66,97,108],"study":[67],"cross-lingual":[68,132],"of":[70,126],"models":[72,115],"using":[73],"probing":[74],"3":[76],"Natural":[77],"Processing":[79],"(NLP)":[80],"Tasks,":[81],"representational":[83],"similarity.":[84],"Our":[85],"results":[86],"indicate":[87],"possible":[91],"but":[92],"disproportionate":[93],"dialects,":[95],"which":[96],"find":[98,109],"be":[100],"partially":[101],"explained":[102],"by":[103],"geographic":[105],"proximity.":[106],"Furthermore,":[107],"evidence":[110],"negative":[112],"interference":[113],"trained":[116],"support":[118],"all":[119],"questions":[123],"degree":[125],"similarity,":[127],"raises":[129],"concerns":[130],"models.":[136]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-12T00:00:00"}
