{"id":"https://openalex.org/W1984708705","doi":"https://doi.org/10.1145/1644879.1644881","title":"Arabic Natural Language Processing","display_name":"Arabic Natural Language Processing","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W1984708705","doi":"https://doi.org/10.1145/1644879.1644881","mag":"1984708705"},"language":"en","primary_location":{"id":"doi:10.1145/1644879.1644881","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1644879.1644881","pdf_url":null,"source":{"id":"https://openalex.org/S56575750","display_name":"ACM Transactions on Asian Language Information Processing","issn_l":"1530-0226","issn":["1530-0226","1558-3430"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian Language Information Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009712450","display_name":"Ali Farghaly","orcid":null},"institutions":[{"id":"https://openalex.org/I36943572","display_name":"Middlebury Institute of International Studies at Monterey","ror":"https://ror.org/05d1z6q04","country_code":"US","type":"education","lineage":["https://openalex.org/I36943572"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ali Farghaly","raw_affiliation_strings":["Monterey Institute of International Studies","Monterey Institute of International Studies,"],"affiliations":[{"raw_affiliation_string":"Monterey Institute of International Studies","institution_ids":["https://openalex.org/I36943572"]},{"raw_affiliation_string":"Monterey Institute of International Studies,","institution_ids":["https://openalex.org/I36943572"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066945309","display_name":"Khaled Shaalan","orcid":"https://orcid.org/0000-0003-0823-8390"},"institutions":[{"id":"https://openalex.org/I193260172","display_name":"British University in Dubai","ror":"https://ror.org/00mc18523","country_code":"AE","type":"education","lineage":["https://openalex.org/I193260172"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Khaled Shaalan","raw_affiliation_strings":["The British University in Dubai"],"affiliations":[{"raw_affiliation_string":"The British University in Dubai","institution_ids":["https://openalex.org/I193260172"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5009712450"],"corresponding_institution_ids":["https://openalex.org/I36943572"],"apc_list":null,"apc_paid":null,"fwci":12.1637,"has_fulltext":false,"cited_by_count":535,"citation_normalized_percentile":{"value":0.98639031,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"8","issue":"4","first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7379429340362549},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.6002711653709412},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5177463889122009},{"id":"https://openalex.org/keywords/section","display_name":"Section (typography)","score":0.49891138076782227},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.462227463722229},{"id":"https://openalex.org/keywords/classical-arabic","display_name":"Classical Arabic","score":0.4298292398452759},{"id":"https://openalex.org/keywords/modern-standard-arabic","display_name":"Modern Standard Arabic","score":0.4225456118583679},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3956184387207031}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7379429340362549},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.6002711653709412},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5177463889122009},{"id":"https://openalex.org/C2780129039","wikidata":"https://www.wikidata.org/wiki/Q1931107","display_name":"Section (typography)","level":2,"score":0.49891138076782227},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.462227463722229},{"id":"https://openalex.org/C2780770203","wikidata":"https://www.wikidata.org/wiki/Q1654327","display_name":"Classical Arabic","level":3,"score":0.4298292398452759},{"id":"https://openalex.org/C2778243841","wikidata":"https://www.wikidata.org/wiki/Q56467","display_name":"Modern Standard Arabic","level":3,"score":0.4225456118583679},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3956184387207031},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1644879.1644881","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1644879.1644881","pdf_url":null,"source":{"id":"https://openalex.org/S56575750","display_name":"ACM Transactions on Asian Language Information Processing","issn_l":"1530-0226","issn":["1530-0226","1558-3430"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian Language Information Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8600000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W84280981","https://openalex.org/W146914567","https://openalex.org/W201141796","https://openalex.org/W207781496","https://openalex.org/W275768480","https://openalex.org/W332987524","https://openalex.org/W609568101","https://openalex.org/W1504308005","https://openalex.org/W1550053614","https://openalex.org/W1558584194","https://openalex.org/W1580467103","https://openalex.org/W1586060904","https://openalex.org/W1722351164","https://openalex.org/W1764109662","https://openalex.org/W1970482722","https://openalex.org/W1974123979","https://openalex.org/W1978174332","https://openalex.org/W1981818098","https://openalex.org/W2008304070","https://openalex.org/W2022414723","https://openalex.org/W2027740070","https://openalex.org/W2038248725","https://openalex.org/W2042777049","https://openalex.org/W2043178336","https://openalex.org/W2061443933","https://openalex.org/W2068882115","https://openalex.org/W2086194511","https://openalex.org/W2096630656","https://openalex.org/W2097229755","https://openalex.org/W2100976324","https://openalex.org/W2103667219","https://openalex.org/W2134141008","https://openalex.org/W2139813717","https://openalex.org/W2141909255","https://openalex.org/W2148398225","https://openalex.org/W2164347990","https://openalex.org/W2170716495","https://openalex.org/W2484386651","https://openalex.org/W2753170778","https://openalex.org/W2779559028","https://openalex.org/W2890439761","https://openalex.org/W4206415992","https://openalex.org/W4240298715","https://openalex.org/W4388167510"],"related_works":["https://openalex.org/W2620283452","https://openalex.org/W4322750817","https://openalex.org/W4400896925","https://openalex.org/W2801712537","https://openalex.org/W4396221470","https://openalex.org/W587642979","https://openalex.org/W2489270562","https://openalex.org/W2894059694","https://openalex.org/W4388343295","https://openalex.org/W4403231732"],"abstract_inverted_index":{"The":[0,21,127],"Arabic":[1,14,49,61,98,112,121,130,158,180,191,199,201,206,252],"language":[2,9,51,62,79,99,122,192],"presents":[3,108],"researchers":[4,231],"and":[5,16,33,42,67,69,101,132,140,160,174,211,246],"developers":[6],"of":[7,23,30,48,59,77,83,89,96,111,119,129,156,163,170,189,198,244,249,257],"natural":[8,50],"processing":[10,52],"(NLP)":[11],"applications":[12,137],"for":[13,135],"text":[15],"speech":[17],"with":[18,56,144,153],"serious":[19],"challenges.":[20],"purpose":[22],"this":[24,90,145],"article":[25,91],"is":[26],"to":[27,34,73,142,217,241],"describe":[28,102],"some":[29,36,229],"these":[31,214],"challenges":[32],"present":[35,183,221],"solutions":[37,222],"that":[38,165,223],"would":[39],"guide":[40],"current":[41],"future":[43],"practitioners":[44],"in":[45,63,80,178,184,232],"the":[46,60,78,81,84,94,97,109,116,120,154,157,161,168,190,195,212,233,242,255],"field":[47],"(ANLP).":[53],"We":[54,182,219],"begin":[55],"general":[57,104],"features":[58,188],"Sections":[64],"1,":[65],"2,":[66],"3":[68,151],"then":[70],"we":[71,92,238,265],"move":[72],"more":[74,258],"specific":[75,187],"properties":[76,155,215],"rest":[82],"article.":[85],"In":[86,235,262],"Section":[87,106,150,185,236,263],"1":[88],"highlight":[93],"significance":[95],"today":[100],"its":[103,133],"properties.":[105],"2":[107],"feature":[110],"Diglossia":[113,131],"showing":[114],"how":[115],"sociolinguistic":[117],"aspects":[118],"differ":[123],"from":[124,167],"other":[125],"languages.":[126],"stability":[128],"implications":[134],"ANLP":[136,260],"are":[138,148],"discussed":[139],"ways":[141],"deal":[143],"problematic":[146],"property":[147,197],"proposed.":[149],"deals":[152],"script":[159],"explosion":[162],"ambiguity":[164],"results":[166],"absence":[169],"short":[171],"vowel":[172],"representations":[173],"overt":[175],"case":[176],"markers":[177],"contemporary":[179],"texts.":[181],"4":[186],"such":[193],"as":[194,202,207],"nonconcatenative":[196],"morphology,":[200],"an":[203],"agglutinative":[204],"language,":[205,210],"a":[208],"pro-drop":[209],"challenge":[213],"pose":[216],"ANLP.":[218],"also":[220],"have":[224],"already":[225],"been":[226],"adopted":[227],"by":[228],"pioneering":[230],"field.":[234],"5":[237],"point":[239],"out":[240],"lack":[243],"formal":[245],"explicit":[247],"grammars":[248],"Modern":[250],"Standard":[251],"which":[253],"impedes":[254],"progress":[256],"advanced":[259],"systems.":[261],"6":[264],"draw":[266],"our":[267],"conclusion.":[268]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":40},{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":57},{"year":2022,"cited_by_count":33},{"year":2021,"cited_by_count":73},{"year":2020,"cited_by_count":39},{"year":2019,"cited_by_count":44},{"year":2018,"cited_by_count":34},{"year":2017,"cited_by_count":39},{"year":2016,"cited_by_count":27},{"year":2015,"cited_by_count":35},{"year":2014,"cited_by_count":26},{"year":2013,"cited_by_count":14},{"year":2012,"cited_by_count":11}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
