{"id":"https://openalex.org/W4206500717","doi":"https://doi.org/10.1007/s40747-021-00608-2","title":"ETHOS: a multi-label hate speech detection dataset","display_name":"ETHOS: a multi-label hate speech detection dataset","publication_year":2022,"publication_date":"2022-01-04","ids":{"openalex":"https://openalex.org/W4206500717","doi":"https://doi.org/10.1007/s40747-021-00608-2"},"language":"en","primary_location":{"id":"doi:10.1007/s40747-021-00608-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-021-00608-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-021-00608-2.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s40747-021-00608-2.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043535730","display_name":"Ioannis Mollas","orcid":"https://orcid.org/0000-0002-7765-7903"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Ioannis Mollas","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"raw_orcid":"https://orcid.org/0000-0002-7765-7903","affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059650033","display_name":"Zoe Chrysopoulou","orcid":null},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Zoe Chrysopoulou","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073119708","display_name":"Stamatis Karlos","orcid":"https://orcid.org/0000-0002-5307-6186"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Stamatis Karlos","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"raw_orcid":"https://orcid.org/0000-0002-5307-6186","affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026561247","display_name":"Grigorios Tsoumakas","orcid":"https://orcid.org/0000-0002-7879-669X"},"institutions":[{"id":"https://openalex.org/I21370196","display_name":"Aristotle University of Thessaloniki","ror":"https://ror.org/02j61yw88","country_code":"GR","type":"education","lineage":["https://openalex.org/I21370196"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Grigorios Tsoumakas","raw_affiliation_strings":["Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece"],"raw_orcid":"https://orcid.org/0000-0002-7879-669X","affiliations":[{"raw_affiliation_string":"Department of Informatics, Aristotle University of Thessaloniki, Thessaloniki, Greece","institution_ids":["https://openalex.org/I21370196"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5043535730"],"corresponding_institution_ids":["https://openalex.org/I21370196"],"apc_list":{"value":1320,"currency":"GBP","value_usd":1619},"apc_paid":{"value":1320,"currency":"GBP","value_usd":1619},"fwci":13.3167,"has_fulltext":true,"cited_by_count":107,"citation_normalized_percentile":{"value":0.99031833,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"8","issue":"6","first_page":"4663","last_page":"4678"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6994731426239014},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.6077029705047607},{"id":"https://openalex.org/keywords/offensive","display_name":"Offensive","score":0.602913498878479},{"id":"https://openalex.org/keywords/ethos","display_name":"Ethos","score":0.5766274333000183},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.5529695153236389},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.551404595375061},{"id":"https://openalex.org/keywords/pace","display_name":"Pace","score":0.5350326895713806},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5320765972137451},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4993925094604492},{"id":"https://openalex.org/keywords/distrust","display_name":"Distrust","score":0.4471021592617035},{"id":"https://openalex.org/keywords/internet-privacy","display_name":"Internet privacy","score":0.43893739581108093},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.43602487444877625},{"id":"https://openalex.org/keywords/legislation","display_name":"Legislation","score":0.42984068393707275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34718188643455505},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3083145022392273},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14021790027618408},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.1355036199092865},{"id":"https://openalex.org/keywords/law","display_name":"Law","score":0.10297432541847229},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.09710118174552917}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6994731426239014},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.6077029705047607},{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.602913498878479},{"id":"https://openalex.org/C2776932993","wikidata":"https://www.wikidata.org/wiki/Q484318","display_name":"Ethos","level":2,"score":0.5766274333000183},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.5529695153236389},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.551404595375061},{"id":"https://openalex.org/C2777526511","wikidata":"https://www.wikidata.org/wiki/Q691543","display_name":"Pace","level":2,"score":0.5350326895713806},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5320765972137451},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4993925094604492},{"id":"https://openalex.org/C2778321746","wikidata":"https://www.wikidata.org/wiki/Q621922","display_name":"Distrust","level":2,"score":0.4471021592617035},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.43893739581108093},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.43602487444877625},{"id":"https://openalex.org/C2777351106","wikidata":"https://www.wikidata.org/wiki/Q49371","display_name":"Legislation","level":2,"score":0.42984068393707275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34718188643455505},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3083145022392273},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14021790027618408},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.1355036199092865},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.10297432541847229},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.09710118174552917},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s40747-021-00608-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-021-00608-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-021-00608-2.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s40747-021-00608-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-021-00608-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-021-00608-2.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6299999952316284,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"},{"score":0.4099999964237213,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320327859","display_name":"Hellenic Foundation for Research and Innovation","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4206500717.pdf","grobid_xml":"https://content.openalex.org/works/W4206500717.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W163939222","https://openalex.org/W586780102","https://openalex.org/W868043366","https://openalex.org/W1524416683","https://openalex.org/W2052684427","https://openalex.org/W2081580037","https://openalex.org/W2113046211","https://openalex.org/W2141007997","https://openalex.org/W2146241755","https://openalex.org/W2250539671","https://openalex.org/W2279689406","https://openalex.org/W2473555522","https://openalex.org/W2595653137","https://openalex.org/W2615868131","https://openalex.org/W2741065173","https://openalex.org/W2782698363","https://openalex.org/W2784010253","https://openalex.org/W2789942211","https://openalex.org/W2800543130","https://openalex.org/W2830578967","https://openalex.org/W2897495521","https://openalex.org/W2906979176","https://openalex.org/W2918540534","https://openalex.org/W2955502525","https://openalex.org/W2956090150","https://openalex.org/W2962977603","https://openalex.org/W2963532322","https://openalex.org/W2963740308","https://openalex.org/W2970921912","https://openalex.org/W2971150411","https://openalex.org/W2972944582","https://openalex.org/W2980536865","https://openalex.org/W2986273318","https://openalex.org/W2986737700","https://openalex.org/W2987103574","https://openalex.org/W3008555361","https://openalex.org/W3014188249","https://openalex.org/W3021453518","https://openalex.org/W3034202663","https://openalex.org/W3038718637","https://openalex.org/W3039169605","https://openalex.org/W3040509489","https://openalex.org/W3046195400","https://openalex.org/W3153645085","https://openalex.org/W3173628907","https://openalex.org/W4232359393","https://openalex.org/W6812880706"],"related_works":["https://openalex.org/W2152370238","https://openalex.org/W2090589575","https://openalex.org/W3193570178","https://openalex.org/W3160132286","https://openalex.org/W2136955267","https://openalex.org/W2712460288","https://openalex.org/W2352717624","https://openalex.org/W2364471629","https://openalex.org/W1499113510","https://openalex.org/W2482316195"],"abstract_inverted_index":{"Abstract":[0],"Online":[1],"hate":[2,141,240],"speech":[3,142,241],"is":[4,12,34,222],"a":[5,15,49,85,107,135,172,226,234],"recent":[6],"problem":[7],"in":[8,45,63,212,243],"our":[9,111,118,125,210],"society":[10],"that":[11,26],"rising":[13],"at":[14],"steady":[16],"pace":[17],"by":[18,37],"leveraging":[19],"the":[20,23,46,80,100,137,148,189,196,215,244],"vulnerabilities":[21],"of":[22,48,60,88,102,117,139,229],"corresponding":[24,81],"regimes":[25],"characterise":[27],"most":[28],"social":[29,126],"media":[30],"platforms.":[31],"This":[32],"phenomenon":[33],"primarily":[35],"fostered":[36],"offensive":[38],"comments,":[39],"either":[40],"during":[41],"user":[42,150],"interaction":[43],"or":[44],"form":[47],"posted":[50],"multimedia":[51],"context.":[52],"Nowadays,":[53],"giant":[54],"corporations":[55],"own":[56],"platforms":[57],"where":[58],"millions":[59],"users":[61],"log":[62],"every":[64],"day,":[65],"and":[66,83,93,98,179,184],"protection":[67],"from":[68,232],"exposure":[69],"to":[70,74,77,124,131,200,214],"similar":[71],"phenomena":[72],"appears":[73],"be":[75],"necessary":[76],"comply":[78],"with":[79,175],"legislation":[82],"maintain":[84],"high":[86],"level":[87],"service":[89],"quality.":[90],"A":[91],"robust":[92],"reliable":[94],"system":[95],"for":[96,208],"detecting":[97],"preventing":[99],"uploading":[101],"relevant":[103],"content":[104],"will":[105],"have":[106],"significant":[108],"impact":[109],"on":[110,182],"digitally":[112],"interconnected":[113],"society.":[114],"Several":[115],"aspects":[116,217],"daily":[119],"lives":[120],"are":[121],"undeniably":[122],"linked":[123],"profiles,":[127],"making":[128],"us":[129],"vulnerable":[130],"abusive":[132],"behaviours.":[133],"As":[134],"result,":[136],"lack":[138],"accurate":[140],"detection":[143],"mechanisms":[144],"would":[145,156],"severely":[146],"degrade":[147],"overall":[149],"experience,":[151],"although":[152],"its":[153],"erroneous":[154],"operation":[155],"pose":[157],"many":[158],"ethical":[159],"concerns.":[160],"In":[161],"this":[162,202],"paper,":[163],"we":[164,194,237],"present":[165,195],"\u2018ETHOS\u2019":[166],"(multi-labEl":[167],"haTe":[168],"speecH":[169],"detectiOn":[170],"dataSet),":[171],"textual":[173],"dataset":[174],"two":[176],"variants:":[177],"binary":[178],"multi-label,":[180],"based":[181],"YouTube":[183],"Reddit":[185],"comments":[186],"validated":[187],"using":[188],"Figure-Eight":[190],"crowdsourcing":[191],"platform.":[192],"Furthermore,":[193],"annotation":[197],"protocol":[198],"used":[199],"create":[201],"dataset:":[203],"an":[204],"active":[205],"sampling":[206],"procedure":[207],"balancing":[209],"data":[211,231],"relation":[213],"various":[216],"defined.":[218],"Our":[219],"key":[220],"assumption":[221],"that,":[223],"even":[224],"gaining":[225],"small":[227],"amount":[228],"labelled":[230],"such":[233],"time-consuming":[235],"process,":[236],"can":[238],"guarantee":[239],"occurrences":[242],"examined":[245],"material.":[246]},"counts_by_year":[{"year":2026,"cited_by_count":11},{"year":2025,"cited_by_count":29},{"year":2024,"cited_by_count":23},{"year":2023,"cited_by_count":28},{"year":2022,"cited_by_count":16}],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2022-01-26T00:00:00"}
