{"id":"https://openalex.org/W2251265054","doi":"https://doi.org/10.3115/v1/w14-3608","title":"Automatic Arabic diacritics restoration based on deep nets","display_name":"Automatic Arabic diacritics restoration based on deep nets","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2251265054","doi":"https://doi.org/10.3115/v1/w14-3608","mag":"2251265054"},"language":"en","primary_location":{"id":"doi:10.3115/v1/w14-3608","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3608","pdf_url":"https://doi.org/10.3115/v1/w14-3608","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the EMNLP 2014 Workshop on Arabic Natural Language Processing (ANLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.3115/v1/w14-3608","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006404143","display_name":"Ahmad A. Al Sallab","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmad Al Sallab","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030016694","display_name":"Mohsen Rashwan","orcid":"https://orcid.org/0000-0003-3712-5408"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohsen Rashwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060184747","display_name":"Hazem Raafat","orcid":"https://orcid.org/0000-0001-7356-5078"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hazem M. Raafat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5058725522","display_name":"Ahmed Rafea","orcid":"https://orcid.org/0000-0001-8109-1845"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed Rafea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.3833,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.93400829,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"65","last_page":"72"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6841470003128052},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.6572460532188416},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5066271424293518},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5046504735946655},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.34961646795272827},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.16468289494514465},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.06473302841186523}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6841470003128052},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.6572460532188416},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5066271424293518},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5046504735946655},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.34961646795272827},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.16468289494514465},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.06473302841186523}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3115/v1/w14-3608","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3608","pdf_url":"https://doi.org/10.3115/v1/w14-3608","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the EMNLP 2014 Workshop on Arabic Natural Language Processing (ANLP)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.3115/v1/w14-3608","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-3608","pdf_url":"https://doi.org/10.3115/v1/w14-3608","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the EMNLP 2014 Workshop on Arabic Natural Language Processing (ANLP)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2109613320","https://openalex.org/W2136534344","https://openalex.org/W2136922672","https://openalex.org/W2143719855","https://openalex.org/W2153186553"],"related_works":["https://openalex.org/W2789919619","https://openalex.org/W2901613113","https://openalex.org/W2915524904","https://openalex.org/W2293457016","https://openalex.org/W2313063416","https://openalex.org/W3169305685","https://openalex.org/W2351428524","https://openalex.org/W2368779261","https://openalex.org/W2161100657","https://openalex.org/W1551406738"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"Arabic":[3,28,75],"diacritics":[4],"restoration":[5],"problem":[6],"is":[7,39,55,78],"tackled":[8],"under":[9],"the":[10,22,95,102,120,127,132],"deep":[11,34],"learning":[12],"framework":[13,32],"presenting":[14],"Confused":[15],"Subset":[16],"Resolution":[17],"(CSR)":[18],"method":[19],"to":[20,27,41,82,106,112,115],"improve":[21],"classification":[23,104,110],"accuracy,":[24],"in":[25,61,80,124],"addition":[26,81],"Part-of-Speech":[29],"(PoS)":[30],"tagging":[31],"using":[33],"neural":[35],"nets.":[36],"Special":[37],"focus":[38],"given":[40],"syntactic":[42,103],"diacritization,":[43],"which":[44],"still":[45],"suffer":[46],"low":[47],"accuracy":[48],"as":[49],"indicated":[50],"by":[51,129],"related":[52],"works.":[53],"Evaluation":[54],"done":[56],"versus":[57],"state-of-the-art":[58],"systems":[59,135],"reported":[60,122,134],"literature,":[62,125],"with":[63],"quite":[64],"challenging":[65],"datasets,":[66],"collected":[67],"from":[68],"different":[69],"domains.":[70],"Standard":[71],"datasets":[72],"like":[73],"LDC":[74],"Tree":[76],"Bank":[77],"used":[79],"custom":[83],"ones":[84],"available":[85],"online":[86],"for":[87],"results":[88,123],"replication.":[89],"Results":[90],"show":[91],"significant":[92],"improvement":[93],"of":[94,119],"proposed":[96],"techniques":[97],"over":[98,131],"other":[99],"approaches,":[100],"reducing":[101],"error":[105,111,128],"9.9%":[107],"and":[108,117],"morphological":[109],"3%":[113],"compared":[114],"12.7%":[116],"3.8%":[118],"best":[121,133],"improving":[126],"22%":[130]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
