{"id":"https://openalex.org/W4406450848","doi":"https://doi.org/10.48550/arxiv.2501.08284","title":"AfriHate: A Multilingual Collection of Hate Speech and Abusive Language Datasets for African Languages","display_name":"AfriHate: A Multilingual Collection of Hate Speech and Abusive Language Datasets for African Languages","publication_year":2025,"publication_date":"2025-01-14","ids":{"openalex":"https://openalex.org/W4406450848","doi":"https://doi.org/10.48550/arxiv.2501.08284"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.08284","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.08284","pdf_url":"https://arxiv.org/pdf/2501.08284","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.08284","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002849148","display_name":"Shamsuddeen Hassan Muhammad","orcid":"https://orcid.org/0000-0001-7708-0799"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Muhammad, Shamsuddeen Hassan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054346112","display_name":"Idris Abdulmumin","orcid":"https://orcid.org/0000-0002-3795-8381"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdulmumin, Idris","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071390079","display_name":"Abinew Ali Ayele","orcid":"https://orcid.org/0000-0003-4686-5053"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ayele, Abinew Ali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088658365","display_name":"David Ifeoluwa Adelani","orcid":"https://orcid.org/0000-0002-0193-2083"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adelani, David Ifeoluwa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023958796","display_name":"Ibrahim Said Ahmad","orcid":"https://orcid.org/0000-0001-9514-1807"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmad, Ibrahim Said","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026042314","display_name":"Saminu Mohammad Aliyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aliyu, Saminu Mohammad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115903002","display_name":"Nelson Odhiambo Onyango","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Onyango, Nelson Odhiambo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041771996","display_name":"Lilian Wanzare","orcid":"https://orcid.org/0000-0002-6718-900X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wanzare, Lilian D. A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012177273","display_name":"Samuel Rutunda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rutunda, Samuel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093321339","display_name":"Lukman Jibril Aliyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aliyu, Lukman Jibril","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079210242","display_name":"Esubalew Alemneh","orcid":"https://orcid.org/0000-0002-1970-3537"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alemneh, Esubalew","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055885995","display_name":"Oumaima Hourrane","orcid":"https://orcid.org/0000-0002-5697-9874"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hourrane, Oumaima","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038187456","display_name":"Hagos Tesfahun Gebremichael","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gebremichael, Hagos Tesfahun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ismail, Elyas Abdi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ismail, Elyas Abdi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051998921","display_name":"Meriem Beloucif","orcid":"https://orcid.org/0000-0002-4659-759X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beloucif, Meriem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008150617","display_name":"Ebrahim Chekol Jibril","orcid":"https://orcid.org/0000-0002-9891-9562"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jibril, Ebrahim Chekol","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004241641","display_name":"Andiswa Bukula","orcid":"https://orcid.org/0000-0002-6667-4599"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bukula, Andiswa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076520827","display_name":"Rooweither Mabuya","orcid":"https://orcid.org/0000-0001-6658-975X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mabuya, Rooweither","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010053988","display_name":"Salomey Osei","orcid":"https://orcid.org/0000-0003-1900-3124"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Osei, Salomey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032216931","display_name":"Abigail Oppong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oppong, Abigail","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040546523","display_name":"Tadesse Destaw Belay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Belay, Tadesse Destaw","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007629765","display_name":"Tadesse Kebede Guge","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guge, Tadesse Kebede","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079615141","display_name":"Tesfa Tegegne Asfaw","orcid":"https://orcid.org/0000-0003-0392-9088"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Asfaw, Tesfa Tegegne","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012284465","display_name":"Chiamaka Ijeoma Chukwuneke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chukwuneke, Chiamaka Ijeoma","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050023117","display_name":"Paul R\u00f6ttger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"R\u00f6ttger, Paul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039544387","display_name":"Seid Muhie Yimam","orcid":"https://orcid.org/0000-0002-8289-388X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yimam, Seid Muhie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5050190445","display_name":"Nedjma Ousidhoum","orcid":"https://orcid.org/0000-0003-3015-4759"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ousidhoum, Nedjma","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":27,"corresponding_author_ids":["https://openalex.org/A5002849148"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5571423172950745},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.540318489074707},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3806780278682709},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.3214242458343506}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5571423172950745},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.540318489074707},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3806780278682709},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.3214242458343506},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.08284","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.08284","pdf_url":"https://arxiv.org/pdf/2501.08284","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.08284","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.08284","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.08284","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.08284","pdf_url":"https://arxiv.org/pdf/2501.08284","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1778956461","display_name":"Incorporating Demographic Factors into Natural Language Processing Models","funder_award_id":"949944","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G3514550006","display_name":null,"funder_award_id":"Centre","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G4812237278","display_name":null,"funder_award_id":"Canada","funder_id":"https://openalex.org/F4320319949","funder_display_name":"International Development Research Centre"},{"id":"https://openalex.org/G7842005466","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320306149","display_name":"Rockefeller Foundation","ror":"https://ror.org/03sfkwk85"},{"id":"https://openalex.org/F4320317153","display_name":"DeepMind","ror":"https://ror.org/00971b260"},{"id":"https://openalex.org/F4320319949","display_name":"International Development Research Centre","ror":"https://ror.org/0445x0472"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320323381","display_name":"Universit\u00e4t Hamburg","ror":"https://ror.org/00g30e956"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406450848.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Hate":[0],"speech":[1,69,117,168],"and":[2,17,38,66,91,102,118,151,158,166,169],"abusive":[3,119],"language":[4,120,171],"are":[5,78,173],"global":[6],"phenomena":[7],"that":[8],"need":[9],"socio-cultural":[10],"background":[11],"knowledge":[12],"to":[13,42,81,94,145],"be":[14],"understood,":[15],"identified,":[16],"moderated.":[18],"However,":[19],"in":[20,87,98,122,128],"many":[21],"regions":[22],"of":[23,33,36,49,60,84,115,148],"the":[24,43,58,61,82,88,92,99,137,142,146,149],"Global":[25],"South,":[26],"there":[27],"have":[28,54,73],"been":[29,56,74],"several":[30],"documented":[31],"occurrences":[32],"(1)":[34],"absence":[35],"moderation":[37,62,103],"(2)":[39],"censorship":[40],"due":[41,80],"reliance":[44],"on":[45,175],"keyword":[46],"spotting":[47],"out":[48],"context.":[50],"Further,":[51],"high-profile":[52],"individuals":[53],"frequently":[55],"at":[57],"center":[59],"process,":[63],"while":[64],"large":[65],"targeted":[67],"hate":[68,116,167],"campaigns":[70],"against":[71],"minorities":[72],"overlooked.":[75],"These":[76],"limitations":[77],"mainly":[79],"lack":[83],"high-quality":[85],"data":[86],"local":[89,96,138],"languages":[90],"failure":[93],"include":[95],"communities":[97],"collection,":[100],"annotation,":[101],"processes.":[104],"To":[105],"address":[106],"this":[107],"issue,":[108],"we":[109],"present":[110,152],"AfriHate:":[111],"a":[112],"multilingual":[113],"collection":[114],"datasets":[121,150],"15":[123],"African":[124],"languages.":[125],"Each":[126],"instance":[127],"AfriHate":[129],"is":[130],"annotated":[131],"by":[132],"native":[133],"speakers":[134],"familiar":[135],"with":[136,157],"culture.":[139],"We":[140],"report":[141],"challenges":[143],"related":[144],"construction":[147],"various":[153],"classification":[154],"baseline":[155],"results":[156],"without":[159],"using":[160],"LLMs.":[161],"The":[162],"datasets,":[163],"individual":[164],"annotations,":[165],"offensive":[170],"lexicons":[172],"available":[174],"https://github.com/AfriHate/AfriHate":[176]},"counts_by_year":[],"updated_date":"2026-04-19T08:26:33.389920","created_date":"2025-10-10T00:00:00"}
