{"id":"https://openalex.org/W2251948394","doi":"https://doi.org/10.3115/v1/w14-5813","title":"Collaboratively Constructed Linguistic Resources for Language Variants and their Exploitation in NLP Application \u2013 the case of Tunisian Arabic and the Social Media","display_name":"Collaboratively Constructed Linguistic Resources for Language Variants and their Exploitation in NLP Application \u2013 the case of Tunisian Arabic and the Social Media","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2251948394","doi":"https://doi.org/10.3115/v1/w14-5813","mag":"2251948394"},"language":"en","primary_location":{"id":"doi:10.3115/v1/w14-5813","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-5813","pdf_url":"https://aclanthology.org/W14-5813.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of Workshop on Lexical and Grammatical Resources for Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/W14-5813.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030866856","display_name":"Fatiha Sadat","orcid":"https://orcid.org/0000-0002-9292-722X"},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]},{"id":"https://openalex.org/I49663120","display_name":"Universit\u00e9 du Qu\u00e9bec","ror":"https://ror.org/010gxg263","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120"]}],"countries":["CA","TN"],"is_corresponding":true,"raw_author_name":"Fatiha Sadat","raw_affiliation_strings":["NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","Rahma Sellami Sfax University, Sfax, Tunisia","University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","Sfax University, Sfax, Tunisia"],"affiliations":[{"raw_affiliation_string":"NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","institution_ids":[]},{"raw_affiliation_string":"Rahma Sellami Sfax University, Sfax, Tunisia","institution_ids":[]},{"raw_affiliation_string":"University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","institution_ids":["https://openalex.org/I49663120"]},{"raw_affiliation_string":"Sfax University, Sfax, Tunisia","institution_ids":["https://openalex.org/I142899784"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011813721","display_name":"Fatma Mallek","orcid":null},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]},{"id":"https://openalex.org/I49663120","display_name":"Universit\u00e9 du Qu\u00e9bec","ror":"https://ror.org/010gxg263","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120"]}],"countries":["CA","TN"],"is_corresponding":false,"raw_author_name":"Fatma Mallek","raw_affiliation_strings":["Sfax University, Sfax, Tunisia","Rahma Sellami Sfax University, Sfax, Tunisia","NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Sfax University, Sfax, Tunisia","institution_ids":["https://openalex.org/I142899784"]},{"raw_affiliation_string":"Rahma Sellami Sfax University, Sfax, Tunisia","institution_ids":[]},{"raw_affiliation_string":"NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","institution_ids":[]},{"raw_affiliation_string":"University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","institution_ids":["https://openalex.org/I49663120"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007861658","display_name":"Mohamed Mahdi Boudabous","orcid":"https://orcid.org/0009-0003-9601-0632"},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]},{"id":"https://openalex.org/I49663120","display_name":"Universit\u00e9 du Qu\u00e9bec","ror":"https://ror.org/010gxg263","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120"]}],"countries":["CA","TN"],"is_corresponding":false,"raw_author_name":"Mohamed Boudabous","raw_affiliation_strings":["Sfax University, Sfax, Tunisia","NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","Rahma Sellami Sfax University, Sfax, Tunisia","University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Sfax University, Sfax, Tunisia","institution_ids":["https://openalex.org/I142899784"]},{"raw_affiliation_string":"NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","institution_ids":[]},{"raw_affiliation_string":"Rahma Sellami Sfax University, Sfax, Tunisia","institution_ids":[]},{"raw_affiliation_string":"University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","institution_ids":["https://openalex.org/I49663120"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077074796","display_name":"Rahma Sellami","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahma Sellami","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045732893","display_name":"Atefeh Farzindar","orcid":null},"institutions":[{"id":"https://openalex.org/I142899784","display_name":"University of Sfax","ror":"https://ror.org/04d4sd432","country_code":"TN","type":"education","lineage":["https://openalex.org/I142899784"]},{"id":"https://openalex.org/I49663120","display_name":"Universit\u00e9 du Qu\u00e9bec","ror":"https://ror.org/010gxg263","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120"]}],"countries":["CA","TN"],"is_corresponding":false,"raw_author_name":"Atefeh Farzindar","raw_affiliation_strings":["NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","Sfax University, Sfax, Tunisia","University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","Rahma Sellami Sfax University, Sfax, Tunisia"],"affiliations":[{"raw_affiliation_string":"NLP Technologies Inc. 52 LeRoyer Street W, Montreal, Canada","institution_ids":[]},{"raw_affiliation_string":"Sfax University, Sfax, Tunisia","institution_ids":["https://openalex.org/I142899784"]},{"raw_affiliation_string":"University of Quebec in Mon-treal 201 President Kennedy, Mon-treal, QC, Canada","institution_ids":["https://openalex.org/I49663120"]},{"raw_affiliation_string":"Rahma Sellami Sfax University, Sfax, Tunisia","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5030866856"],"corresponding_institution_ids":["https://openalex.org/I142899784","https://openalex.org/I49663120"],"apc_list":null,"apc_paid":null,"fwci":2.9419,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.92420283,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10759","display_name":"Translation Studies and Practices","score":0.982200026512146,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7287658452987671},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.6930255889892578},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6688157916069031},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.6506799459457397},{"id":"https://openalex.org/keywords/arabic","display_name":"Arabic","score":0.6445900201797485},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6227797269821167},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5819939374923706},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5662152767181396},{"id":"https://openalex.org/keywords/modern-standard-arabic","display_name":"Modern Standard Arabic","score":0.46097153425216675},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.1156674325466156}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7287658452987671},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.6930255889892578},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6688157916069031},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.6506799459457397},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.6445900201797485},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6227797269821167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5819939374923706},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5662152767181396},{"id":"https://openalex.org/C2778243841","wikidata":"https://www.wikidata.org/wiki/Q56467","display_name":"Modern Standard Arabic","level":3,"score":0.46097153425216675},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.1156674325466156},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3115/v1/w14-5813","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-5813","pdf_url":"https://aclanthology.org/W14-5813.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of Workshop on Lexical and Grammatical Resources for Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.3115/v1/w14-5813","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-5813","pdf_url":"https://aclanthology.org/W14-5813.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of Workshop on Lexical and Grammatical Resources for Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2251948394.pdf","grobid_xml":"https://content.openalex.org/works/W2251948394.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W78842653","https://openalex.org/W137989762","https://openalex.org/W1544567521","https://openalex.org/W1631260214","https://openalex.org/W1895315011","https://openalex.org/W1957504465","https://openalex.org/W1970902588","https://openalex.org/W1977195462","https://openalex.org/W1978174332","https://openalex.org/W2097743493","https://openalex.org/W2101105183","https://openalex.org/W2135161317","https://openalex.org/W2156554947","https://openalex.org/W2168576900","https://openalex.org/W2250862217","https://openalex.org/W2251147480","https://openalex.org/W2251986002","https://openalex.org/W2411190207","https://openalex.org/W2610671394","https://openalex.org/W2617702252","https://openalex.org/W3166879702","https://openalex.org/W3170253630"],"related_works":["https://openalex.org/W4243485167","https://openalex.org/W2620283452","https://openalex.org/W4322750817","https://openalex.org/W4245232085","https://openalex.org/W2801712537","https://openalex.org/W587642979","https://openalex.org/W2250668514","https://openalex.org/W2894059694","https://openalex.org/W3173761424","https://openalex.org/W4299493485"],"abstract_inverted_index":{"Modern":[0],"Standard":[1],"Arabic":[2,10,12,28,76,144],"(MSA)":[3],"is":[4,133],"the":[5,48,59,72,148],"formal":[6],"language":[7,17,121],"in":[8,22,117],"most":[9,27],"countries.":[11],"Dialects":[13],"(AD)":[14],"or":[15],"daily":[16],"differs":[18],"from":[19],"MSA":[20,40,51,91,125],"especially":[21,38],"social":[23,29,64,87],"media":[24,30,88],"communication.":[25],"However,":[26],"texts":[31,62],"have":[32],"mixed":[33],"forms":[34],"and":[35,41,52,92,105,115,140],"many":[36],"variations":[37],"between":[39,50],"AD.":[42],"This":[43,131],"paper":[44,69],"aims":[45],"to":[46,119,123],"bridge":[47],"gap":[49],"AD":[53],"by":[54],"providing":[55],"a":[56,86,101,106,120,134],"framework":[57],"for":[58,85,143],"translation":[60,84],"of":[61,63,75,108,127],"media.":[65],"More":[66],"precisely,":[67],"this":[68],"focuses":[70],"on":[71,81],"Tunisian":[73,128],"Dialect":[74],"(TAD)":[77],"with":[78],"an":[79],"application":[80],"automatic":[82],"machine":[83],"text":[89],"into":[90],"any":[93],"other":[94],"target":[95],"language.":[96],"Linguistic":[97],"tools":[98],"such":[99],"as":[100],"bilingual":[102],"TAD-MSA":[103],"lexicon":[104],"set":[107],"grammatical":[109],"mapping":[110],"rules":[111],"are":[112],"collaboratively":[113,137],"constructed":[114,138],"exploited":[116],"addition":[118],"model":[122],"produce":[124],"sentences":[126],"dialectal":[129],"sentences.":[130],"work":[132],"first-step":[135],"towards":[136],"semantic":[139],"lexical":[141],"resources":[142],"Social":[145,151],"Media":[146,152],"within":[147],"ASMAT":[149],"(Arabic":[150],"Analysis":[153],"Tools)":[154],"project.":[155]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
