{"id":"https://openalex.org/W4393407232","doi":"https://doi.org/10.1109/aiccsa59173.2023.10479250","title":"Lisan: Yemeni, Iraqi, Libyan, and Sudanese Arabic Dialect Corpora with Morphological Annotations","display_name":"Lisan: Yemeni, Iraqi, Libyan, and Sudanese Arabic Dialect Corpora with Morphological Annotations","publication_year":2023,"publication_date":"2023-12-04","ids":{"openalex":"https://openalex.org/W4393407232","doi":"https://doi.org/10.1109/aiccsa59173.2023.10479250"},"language":"en","primary_location":{"id":"doi:10.1109/aiccsa59173.2023.10479250","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aiccsa59173.2023.10479250","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050418400","display_name":"Mustafa Jarrar","orcid":"https://orcid.org/0000-0003-4351-4207"},"institutions":[{"id":"https://openalex.org/I94800806","display_name":"Birzeit University","ror":"https://ror.org/0256kw398","country_code":"PS","type":"education","lineage":["https://openalex.org/I94800806"]}],"countries":["PS"],"is_corresponding":true,"raw_author_name":"Mustafa Jarrar","raw_affiliation_strings":["Birzeit University,Birzeit,Palestine","Birzeit University, Birzeit, Palestine"],"affiliations":[{"raw_affiliation_string":"Birzeit University,Birzeit,Palestine","institution_ids":["https://openalex.org/I94800806"]},{"raw_affiliation_string":"Birzeit University, Birzeit, Palestine","institution_ids":["https://openalex.org/I94800806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010806171","display_name":"Fadi A. Zaraket","orcid":"https://orcid.org/0000-0001-5909-6375"},"institutions":[{"id":"https://openalex.org/I98635879","display_name":"American University of Beirut","ror":"https://ror.org/04pznsd21","country_code":"LB","type":"education","lineage":["https://openalex.org/I98635879"]}],"countries":["LB"],"is_corresponding":false,"raw_author_name":"Fadi A Zaraket","raw_affiliation_strings":["American University of Beirut,Beirut,Lebanon","American University of Beirut, Beirut, Lebanon"],"affiliations":[{"raw_affiliation_string":"American University of Beirut,Beirut,Lebanon","institution_ids":["https://openalex.org/I98635879"]},{"raw_affiliation_string":"American University of Beirut, Beirut, Lebanon","institution_ids":["https://openalex.org/I98635879"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049723879","display_name":"Tymaa Hammouda","orcid":null},"institutions":[{"id":"https://openalex.org/I94800806","display_name":"Birzeit University","ror":"https://ror.org/0256kw398","country_code":"PS","type":"education","lineage":["https://openalex.org/I94800806"]}],"countries":["PS"],"is_corresponding":false,"raw_author_name":"Tymaa Hammouda","raw_affiliation_strings":["Birzeit University,Birzeit,Palestine","Birzeit University, Birzeit, Palestine"],"affiliations":[{"raw_affiliation_string":"Birzeit University,Birzeit,Palestine","institution_ids":["https://openalex.org/I94800806"]},{"raw_affiliation_string":"Birzeit University, Birzeit, Palestine","institution_ids":["https://openalex.org/I94800806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025455042","display_name":"Daanish Masood Alavi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daanish Masood Alavi","raw_affiliation_strings":["Peace-Building and Political Affairs,UN Department,New York,USA","UN Department, Peace-Building and Political Affairs, New York, USA"],"affiliations":[{"raw_affiliation_string":"Peace-Building and Political Affairs,UN Department,New York,USA","institution_ids":[]},{"raw_affiliation_string":"UN Department, Peace-Building and Political Affairs, New York, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012925715","display_name":"Martin W\u00e4hlisch","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martin W\u00e4hlisch","raw_affiliation_strings":["Peace-Building and Political Affairs,UN Department,New York,USA","UN Department, Peace-Building and Political Affairs, New York, USA"],"affiliations":[{"raw_affiliation_string":"Peace-Building and Political Affairs,UN Department,New York,USA","institution_ids":[]},{"raw_affiliation_string":"UN Department, Peace-Building and Political Affairs, New York, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5050418400"],"corresponding_institution_ids":["https://openalex.org/I94800806"],"apc_list":null,"apc_paid":null,"fwci":0.3554,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.69150144,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.984000027179718,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13912","display_name":"Language, Linguistics, Cultural Analysis","score":0.983299970626831,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13623","display_name":"Linguistic Studies and Language Acquisition","score":0.929099977016449,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.8840056657791138},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5649476647377014},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5224962830543518},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.5152814388275146},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46666187047958374},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.06284183263778687}],"concepts":[{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.8840056657791138},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5649476647377014},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5224962830543518},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.5152814388275146},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46666187047958374},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.06284183263778687}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/aiccsa59173.2023.10479250","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aiccsa59173.2023.10479250","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA)","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/8250ebac-6ce4-4149-bd41-3f626044a360","is_oa":false,"landing_page_url":"https://research.birmingham.ac.uk/en/publications/8250ebac-6ce4-4149-bd41-3f626044a360","pdf_url":null,"source":{"id":"https://openalex.org/S4306402634","display_name":"University of Birmingham Research Portal (University of Birmingham)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79619799","host_organization_name":"University of Birmingham","host_organization_lineage":["https://openalex.org/I79619799"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Jarrar, M, Zaraket, F A, Hammouda, T, Alavi, D M & Wahlisch, M 2024, Lisan : Yemeni, Iraqi, Libyan, and Sudanese Arabic Dialect Corpora with Morphological Annotations. in 2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA). Proceedings of IEEE/ACS International Conference on Computer Systems and Applications, AICCSA, IEEE, 20th ACS/IEEE International Conference on Computer Systems and Applications, AICCSA 2023, Giza, Egypt, 4/12/23. https://doi.org/10.1109/AICCSA59173.2023.10479250","raw_type":"contributionToPeriodical"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4099999964237213,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1993757038","https://openalex.org/W2117202778","https://openalex.org/W2560280095","https://openalex.org/W2612649659","https://openalex.org/W2614322402","https://openalex.org/W2756623576","https://openalex.org/W2771976988","https://openalex.org/W2799399790","https://openalex.org/W2949354012","https://openalex.org/W2970442528","https://openalex.org/W2997186977","https://openalex.org/W3011470788","https://openalex.org/W3114605654","https://openalex.org/W3149627794","https://openalex.org/W3178570354","https://openalex.org/W3213358601","https://openalex.org/W4205509257","https://openalex.org/W4294214983","https://openalex.org/W4385573366","https://openalex.org/W4391156274","https://openalex.org/W6601625150","https://openalex.org/W6605374713","https://openalex.org/W6690971519","https://openalex.org/W6690972069","https://openalex.org/W6744301851","https://openalex.org/W6751400415","https://openalex.org/W6753010206","https://openalex.org/W6766750367","https://openalex.org/W6786709265","https://openalex.org/W6838679636","https://openalex.org/W6838992615","https://openalex.org/W6839581624","https://openalex.org/W6849158869","https://openalex.org/W6849686114","https://openalex.org/W6890250144","https://openalex.org/W6890314154","https://openalex.org/W6909269736"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4249048193","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0],"article":[1],"presents":[2],"morphologically-annotated":[3],"Yemeni,":[4],"Sudanese,":[5],"Iraqi,":[6],"and":[7,58,61,90,92,105,122,128,139,149],"Libyan":[8],"Arabic":[9,113],"dialects":[10,48,73],"(${\\text{L}\\hat{\\text{i}}\\text{sa}\\bar{\\text{n}}}$)":[11],"corpora.":[12],"${\\text{L}\\hat{\\text{i}}\\text{sa}\\bar{\\text{n}}}$":[13],"features":[14,98],"around":[15],"1.2":[16],"million":[17],"tokens.":[18],"We":[19,110,131],"collected":[20,38,55],"the":[21,24,45,71,76,84,112,120,150],"content":[22],"of":[23,44,70,102,137],"corpora":[25,43,86,152],"from":[26,40,56],"several":[27],"social":[28],"media":[29],"platforms.":[30],"The":[31,42,78],"Yemeni":[32],"corpus":[33],"($\\tilde":[34,49],"1.05{\\text{M}}$":[35],"tokens)":[36],"was":[37,53],"automatically":[39],"Twitter.":[41],"other":[46],"three":[47],"50{\\text{K}}$":[50],"tokens":[51],"each)":[52],"manually":[54],"Facebook":[57],"YouTube":[59],"posts":[60],"comments.":[62],"Thirty-five":[63],"(35)":[64],"annotators":[65,79,121,133],"who":[66],"are":[67,153],"native":[68],"speakers":[69],"target":[72],"carried":[74],"out":[75],"annotations.":[77],"segmented":[80],"all":[81],"words":[82],"in":[83,108],"four":[85,151],"into":[87],"prefixes,":[88],"stems":[89],"suffixes":[91],"labeled":[93],"each":[94],"with":[95,126],"different":[96],"morphological":[97],"such":[99],"as":[100],"part":[101],"speech,":[103],"lemma,":[104],"a":[106,135],"gloss":[107],"English.":[109],"developed":[111],"Dialect":[114],"Annotation":[115],"Toolkit":[116],"(ADAT)":[117],"to":[118,123,142],"assist":[119],"ensure":[124],"compatibility":[125],"SAMA":[127],"Curras":[129],"tagsets.":[130],"trained":[132],"on":[134,140],"set":[136],"guidelines":[138],"how":[141],"use":[143],"ADAT.":[144],"ADAT":[145],"is":[146],"open":[147],"source,":[148],"available":[154],"at":[155],"https://sina.birzeit.edu/currasat.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
