{"id":"https://openalex.org/W2740918723","doi":"https://doi.org/10.18653/v1/w17-1316","title":"Arabic POS Tagging: Don't Abandon Feature Engineering Just Yet","display_name":"Arabic POS Tagging: Don't Abandon Feature Engineering Just Yet","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2740918723","doi":"https://doi.org/10.18653/v1/w17-1316","mag":"2740918723"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w17-1316","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-1316","pdf_url":"https://www.aclweb.org/anthology/W17-1316.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third Arabic Natural Language Processing Workshop","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W17-1316.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111452036","display_name":"Kareem Darwish","orcid":null},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":true,"raw_author_name":"Kareem Darwish","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102924560","display_name":"Hamdy Mubarak","orcid":"https://orcid.org/0000-0002-9051-6240"},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Hamdy Mubarak","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047182137","display_name":"Ahmed Abdelal\u00ed","orcid":"https://orcid.org/0000-0002-4160-8181"},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Ahmed Abdelali","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033221342","display_name":"Mohamed Eldesouki","orcid":"https://orcid.org/0009-0009-6662-5883"},"institutions":[{"id":"https://openalex.org/I4210138380","display_name":"Qatar Cardiovascular Research Center","ror":"https://ror.org/038vyt185","country_code":"QA","type":"healthcare","lineage":["https://openalex.org/I4210138380"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Mohamed Eldesouki","raw_affiliation_strings":["Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar"],"affiliations":[{"raw_affiliation_string":"Qatar Computing Research Institute (QCRI) HBKU, Doha, Qatar","institution_ids":["https://openalex.org/I4210138380"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111452036"],"corresponding_institution_ids":["https://openalex.org/I4210138380"],"apc_list":null,"apc_paid":null,"fwci":3.1203,"has_fulltext":true,"cited_by_count":32,"citation_normalized_percentile":{"value":0.93399844,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7910279631614685},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.7764842510223389},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.7312475442886353},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7118592858314514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6925018429756165},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.650188148021698},{"id":"https://openalex.org/keywords/feature-engineering","display_name":"Feature engineering","score":0.6323021054267883},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5486810207366943},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5207214951515198},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.5159466862678528},{"id":"https://openalex.org/keywords/ranking-svm","display_name":"Ranking SVM","score":0.5152769088745117},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46842801570892334},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.44882306456565857},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.44261297583580017},{"id":"https://openalex.org/keywords/sequence-labeling","display_name":"Sequence labeling","score":0.42159533500671387},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4201483428478241},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37919339537620544},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.25435972213745117},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0856313407421112},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.06770408153533936},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06561276316642761}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7910279631614685},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.7764842510223389},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.7312475442886353},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7118592858314514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6925018429756165},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.650188148021698},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.6323021054267883},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5486810207366943},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5207214951515198},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.5159466862678528},{"id":"https://openalex.org/C124975894","wikidata":"https://www.wikidata.org/wiki/Q7293290","display_name":"Ranking SVM","level":3,"score":0.5152769088745117},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46842801570892334},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.44882306456565857},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.44261297583580017},{"id":"https://openalex.org/C35639132","wikidata":"https://www.wikidata.org/wiki/Q7452468","display_name":"Sequence labeling","level":3,"score":0.42159533500671387},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4201483428478241},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37919339537620544},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25435972213745117},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0856313407421112},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.06770408153533936},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06561276316642761},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w17-1316","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-1316","pdf_url":"https://www.aclweb.org/anthology/W17-1316.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third Arabic Natural Language Processing Workshop","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w17-1316","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-1316","pdf_url":"https://www.aclweb.org/anthology/W17-1316.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third Arabic Natural Language Processing Workshop","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2740918723.pdf","grobid_xml":"https://content.openalex.org/works/W2740918723.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W4758264","https://openalex.org/W162171320","https://openalex.org/W196214544","https://openalex.org/W1576227399","https://openalex.org/W1899794420","https://openalex.org/W2035720976","https://openalex.org/W2064675550","https://openalex.org/W2140090592","https://openalex.org/W2141599568","https://openalex.org/W2151690415","https://openalex.org/W2229177960","https://openalex.org/W2231920551","https://openalex.org/W2250283392","https://openalex.org/W2250816155","https://openalex.org/W2413317570","https://openalex.org/W2471147443","https://openalex.org/W2492083338","https://openalex.org/W2575598244","https://openalex.org/W2949563612","https://openalex.org/W2964090065","https://openalex.org/W3122775348","https://openalex.org/W4285719527","https://openalex.org/W4293374342"],"related_works":["https://openalex.org/W2894378449","https://openalex.org/W4298061178","https://openalex.org/W4387022695","https://openalex.org/W2295030615","https://openalex.org/W2787518671","https://openalex.org/W3012125532","https://openalex.org/W3047727388","https://openalex.org/W2590462354","https://openalex.org/W2900788028","https://openalex.org/W2990142167"],"abstract_inverted_index":{"This":[0],"paper":[1],"focuses":[2],"on":[3],"comparing":[4],"between":[5],"using":[6,97],"Support":[7],"Vector":[8],"Machine":[9],"based":[10,20,120],"ranking":[11],"(SVM":[12],"Rank":[13,33,116],")":[14],"and":[15,117],"Bidirectional":[16],"Long-Short-Term-Memory":[17],"(bi-LSTM)":[18],"neuralnetwork":[19],"sequence":[21,72],"labeling":[22,73],"in":[23],"building":[24],"a":[25,40],"state-of-the-art":[26,36],"Arabic":[27],"part-ofspeech":[28],"tagging":[29],"system.":[30],"Using":[31,46],"SVM":[32,84,115],"leads":[34],"to":[35,56,88,108],"results,":[37],"but":[38],"with":[39,51,74,103],"fair":[41],"amount":[42],"of":[43,76],"feature":[44],"engineering.":[45],"bi-LSTM,":[47],"particularly":[48],"when":[49],"combined":[50],"word":[52],"embeddings,":[53],"may":[54,99],"lead":[55],"competitive":[57],"POS-tagging":[58],"results":[59],"by":[60],"automatically":[61],"deducing":[62],"latent":[63],"linguistic":[64],"features.":[65,109],"However,":[66],"we":[67,80],"show":[68,93],"that":[69,79,94],"augmenting":[70],"bi-LSTM":[71,119],"some":[75],"the":[77,83,104,114,118,123],"features":[78],"used":[81],"for":[82,122],"Rankbased":[85],"tagger":[86],"yields":[87],"further":[89],"improvements.":[90],"We":[91,110],"also":[92],"gains":[95,105],"realized":[96],"embeddings":[98],"not":[100],"be":[101],"additive":[102],"achieved":[106],"due":[107],"are":[111],"open-sourcing":[112],"both":[113],"systems":[121],"research":[124],"community.":[125]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
