{"id":"https://openalex.org/W2123447988","doi":"https://doi.org/10.1017/s1351324915000030","title":"Arabic spelling error detection and correction","display_name":"Arabic spelling error detection and correction","publication_year":2015,"publication_date":"2015-03-18","ids":{"openalex":"https://openalex.org/W2123447988","doi":"https://doi.org/10.1017/s1351324915000030","mag":"2123447988"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324915000030","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324915000030","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075586667","display_name":"Mohammed Attia","orcid":null},"institutions":[{"id":"https://openalex.org/I193260172","display_name":"British University in Dubai","ror":"https://ror.org/00mc18523","country_code":"AE","type":"education","lineage":["https://openalex.org/I193260172"]},{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["AE","IE"],"is_corresponding":true,"raw_author_name":"MOHAMMED ATTIA","raw_affiliation_strings":["Faculty of Engineering and IT, The British University in Dubai, UAE e-mail:","School of Computing, Dublin City University, Ireland, e-mail:"],"affiliations":[{"raw_affiliation_string":"Faculty of Engineering and IT, The British University in Dubai, UAE e-mail:","institution_ids":["https://openalex.org/I193260172"]},{"raw_affiliation_string":"School of Computing, Dublin City University, Ireland, e-mail:","institution_ids":["https://openalex.org/I42934936"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019260966","display_name":"Pavel Pecina","orcid":"https://orcid.org/0000-0002-1855-5931"},"institutions":[{"id":"https://openalex.org/I21250087","display_name":"Charles University","ror":"https://ror.org/024d6js02","country_code":"CZ","type":"education","lineage":["https://openalex.org/I21250087"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"PAVEL PECINA","raw_affiliation_strings":["Faculty of Mathematics and Physics, Charles University in Prague, Czech Republic e-mail:"],"affiliations":[{"raw_affiliation_string":"Faculty of Mathematics and Physics, Charles University in Prague, Czech Republic e-mail:","institution_ids":["https://openalex.org/I21250087"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086381528","display_name":"Younes Samih","orcid":"https://orcid.org/0000-0002-0485-7920"},"institutions":[{"id":"https://openalex.org/I44260953","display_name":"Heinrich Heine University D\u00fcsseldorf","ror":"https://ror.org/024z2rq82","country_code":"DE","type":"education","lineage":["https://openalex.org/I44260953"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"YOUNES SAMIH","raw_affiliation_strings":["Department of Linguistics and Information Science, Heinrich-Heine-Universit\u00e4t D\u00fcsseldorf, Germany e-mail:"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics and Information Science, Heinrich-Heine-Universit\u00e4t D\u00fcsseldorf, Germany e-mail:","institution_ids":["https://openalex.org/I44260953"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066945309","display_name":"Khaled Shaalan","orcid":"https://orcid.org/0000-0003-0823-8390"},"institutions":[{"id":"https://openalex.org/I193260172","display_name":"British University in Dubai","ror":"https://ror.org/00mc18523","country_code":"AE","type":"education","lineage":["https://openalex.org/I193260172"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"KHALED SHAALAN","raw_affiliation_strings":["Faculty of Engineering and IT, The British University in Dubai, UAE e-mail:"],"affiliations":[{"raw_affiliation_string":"Faculty of Engineering and IT, The British University in Dubai, UAE e-mail:","institution_ids":["https://openalex.org/I193260172"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049194403","display_name":"Josef van Genabith","orcid":"https://orcid.org/0000-0003-1322-7944"},"institutions":[{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"JOSEF VAN GENABITH","raw_affiliation_strings":["School of Computing, Dublin City University, Ireland, e-mail:"],"affiliations":[{"raw_affiliation_string":"School of Computing, Dublin City University, Ireland, e-mail:","institution_ids":["https://openalex.org/I42934936"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5075586667"],"corresponding_institution_ids":["https://openalex.org/I193260172","https://openalex.org/I42934936"],"apc_list":null,"apc_paid":null,"fwci":0.8629,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.82396218,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"22","issue":"5","first_page":"751","last_page":"773"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.909677267074585},{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.9010275602340698},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.6978920698165894},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6454095840454102},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6118083000183105},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5844944715499878},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.5563941597938538},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5037173628807068},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4532814621925354},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1585438847541809},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10945117473602295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.909677267074585},{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.9010275602340698},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.6978920698165894},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6454095840454102},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6118083000183105},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5844944715499878},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.5563941597938538},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5037173628807068},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4532814621925354},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1585438847541809},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10945117473602295},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s1351324915000030","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324915000030","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7900000214576721,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W24718583","https://openalex.org/W126222424","https://openalex.org/W1516896190","https://openalex.org/W1552461563","https://openalex.org/W1553646478","https://openalex.org/W1577352519","https://openalex.org/W1581233860","https://openalex.org/W1647671624","https://openalex.org/W1650656906","https://openalex.org/W1860104593","https://openalex.org/W1935410517","https://openalex.org/W1972099155","https://openalex.org/W1987385324","https://openalex.org/W2010595692","https://openalex.org/W2018616927","https://openalex.org/W2057900969","https://openalex.org/W2066792529","https://openalex.org/W2076772758","https://openalex.org/W2099412388","https://openalex.org/W2101200183","https://openalex.org/W2121227244","https://openalex.org/W2124397360","https://openalex.org/W2126784811","https://openalex.org/W2140563376","https://openalex.org/W2159781504","https://openalex.org/W2167730892","https://openalex.org/W2170276118","https://openalex.org/W2250268234","https://openalex.org/W2600716915","https://openalex.org/W2733628661","https://openalex.org/W2911716267","https://openalex.org/W2912409473","https://openalex.org/W2913539360","https://openalex.org/W2968573267","https://openalex.org/W4246663459","https://openalex.org/W4248506830","https://openalex.org/W6605210145","https://openalex.org/W6636891654","https://openalex.org/W6636915900","https://openalex.org/W6640227696","https://openalex.org/W6678277124","https://openalex.org/W6678359804","https://openalex.org/W6681049082"],"related_works":["https://openalex.org/W2161008081","https://openalex.org/W2100947578","https://openalex.org/W4298186509","https://openalex.org/W2556702969","https://openalex.org/W217221262","https://openalex.org/W611030372","https://openalex.org/W1974418053","https://openalex.org/W2021532426","https://openalex.org/W2081317458","https://openalex.org/W2944691285"],"abstract_inverted_index":{"Abstract":[0],"A":[1],"spelling":[2],"error":[3,22,92,96],"detection":[4],"and":[5,24,81,86,98,120,131,146],"correction":[6],"application":[7],"is":[8],"typically":[9],"based":[10],"on":[11],"three":[12,51],"main":[13],"components:":[14],"a":[15,25,78,82],"dictionary":[16,69],"(or":[17],"reference":[18],"word":[19],"list),":[20],"an":[21,100,122],"model":[23,93,109],"language":[26,41,108],"model.":[27],"While":[28],"most":[29],"of":[30,49,63,70,114],"the":[31,34,40,50,60,64,91,107,112,127],"attention":[32],"in":[33,47,59,116],"literature":[35],"has":[36],"been":[37],"directed":[38],"to":[39,55,125],"model,":[42],"we":[43],"show":[44,134],"how":[45],"improvements":[46,58],"any":[48],"components":[52],"can":[53],"lead":[54],"significant":[56],"cumulative":[57],"overall":[61],"performance":[62],"system.":[65],"We":[66,89,104],"develop":[67],"our":[68,136],"9.2":[71],"million":[72],"fully-inflected":[73],"Arabic":[74],"words":[75],"(types)":[76],"from":[77],"morphological":[79],"transducer":[80],"large":[83],"corpus,":[84],"validated":[85],"manually":[87],"revised.":[88],"improve":[90,106],"by":[94,110],"analyzing":[95,111],"types":[97],"creating":[99],"edit":[101],"distance":[102],"re-ranker.":[103],"also":[105],"level":[113],"noise":[115],"different":[117],"data":[118],"sources":[119],"selecting":[121],"optimal":[123],"subset":[124],"train":[126],"system":[128,137],"on.":[129],"Testing":[130],"evaluation":[132],"experiments":[133],"that":[135],"significantly":[138],"outperforms":[139],"Microsoft":[140],"Word":[141],"2013,":[142],"OpenOffice":[143],"Ayaspell":[144],"3.4":[145],"Google":[147],"Docs.":[148]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
