{"id":"https://openalex.org/W4393406903","doi":"https://doi.org/10.1109/aiccsa59173.2023.10479258","title":"Offensive Hebrew Corpus and Detection using BERT","display_name":"Offensive Hebrew Corpus and Detection using BERT","publication_year":2023,"publication_date":"2023-12-04","ids":{"openalex":"https://openalex.org/W4393406903","doi":"https://doi.org/10.1109/aiccsa59173.2023.10479258"},"language":"en","primary_location":{"id":"doi:10.1109/aiccsa59173.2023.10479258","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/aiccsa59173.2023.10479258","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113392243","display_name":"Nagham Hamad","orcid":null},"institutions":[{"id":"https://openalex.org/I94800806","display_name":"Birzeit University","ror":"https://ror.org/0256kw398","country_code":"PS","type":"education","lineage":["https://openalex.org/I94800806"]}],"countries":["PS"],"is_corresponding":true,"raw_author_name":"Nagham Hamad","raw_affiliation_strings":["Birzeit University,Palestine","Birzeit University, Palestine"],"affiliations":[{"raw_affiliation_string":"Birzeit University,Palestine","institution_ids":["https://openalex.org/I94800806"]},{"raw_affiliation_string":"Birzeit University, Palestine","institution_ids":["https://openalex.org/I94800806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050418400","display_name":"Mustafa Jarrar","orcid":"https://orcid.org/0000-0003-4351-4207"},"institutions":[{"id":"https://openalex.org/I94800806","display_name":"Birzeit University","ror":"https://ror.org/0256kw398","country_code":"PS","type":"education","lineage":["https://openalex.org/I94800806"]}],"countries":["PS"],"is_corresponding":false,"raw_author_name":"Mustafa Jarrar","raw_affiliation_strings":["Birzeit University,Palestine","Birzeit University, Palestine"],"affiliations":[{"raw_affiliation_string":"Birzeit University,Palestine","institution_ids":["https://openalex.org/I94800806"]},{"raw_affiliation_string":"Birzeit University, Palestine","institution_ids":["https://openalex.org/I94800806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032535740","display_name":"Mohammad Khalilia","orcid":null},"institutions":[{"id":"https://openalex.org/I94800806","display_name":"Birzeit University","ror":"https://ror.org/0256kw398","country_code":"PS","type":"education","lineage":["https://openalex.org/I94800806"]}],"countries":["PS"],"is_corresponding":false,"raw_author_name":"Mohammad Khalilia","raw_affiliation_strings":["Birzeit University,Palestine","Birzeit University, Palestine"],"affiliations":[{"raw_affiliation_string":"Birzeit University,Palestine","institution_ids":["https://openalex.org/I94800806"]},{"raw_affiliation_string":"Birzeit University, Palestine","institution_ids":["https://openalex.org/I94800806"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5092828995","display_name":"Nadim Nashif","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nadim Nashif","raw_affiliation_strings":["7amleh Center,Palestine","7amleh Center, Palestine"],"affiliations":[{"raw_affiliation_string":"7amleh Center,Palestine","institution_ids":[]},{"raw_affiliation_string":"7amleh Center, Palestine","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5113392243"],"corresponding_institution_ids":["https://openalex.org/I94800806"],"apc_list":null,"apc_paid":null,"fwci":0.5112,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.73594442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/offensive","display_name":"Offensive","score":0.8972471356391907},{"id":"https://openalex.org/keywords/hebrew","display_name":"Hebrew","score":0.7003214359283447},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5768597722053528},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45608067512512207},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4010826349258423},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.19799676537513733},{"id":"https://openalex.org/keywords/literature","display_name":"Literature","score":0.1505776047706604},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11978912353515625},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.06489244103431702}],"concepts":[{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.8972471356391907},{"id":"https://openalex.org/C91304198","wikidata":"https://www.wikidata.org/wiki/Q9288","display_name":"Hebrew","level":2,"score":0.7003214359283447},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5768597722053528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45608067512512207},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4010826349258423},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.19799676537513733},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.1505776047706604},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11978912353515625},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.06489244103431702}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/aiccsa59173.2023.10479258","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/aiccsa59173.2023.10479258","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2031238627","https://openalex.org/W2560280095","https://openalex.org/W2612649659","https://openalex.org/W2747187574","https://openalex.org/W2791345409","https://openalex.org/W2896457183","https://openalex.org/W2898401058","https://openalex.org/W2917435974","https://openalex.org/W2919234748","https://openalex.org/W2922580172","https://openalex.org/W2948902769","https://openalex.org/W2962977603","https://openalex.org/W2963943967","https://openalex.org/W3008110149","https://openalex.org/W3035390927","https://openalex.org/W3087096149","https://openalex.org/W3087777115","https://openalex.org/W3114605654","https://openalex.org/W3115489948","https://openalex.org/W3115903740","https://openalex.org/W3116140977","https://openalex.org/W3121384227","https://openalex.org/W3126181281","https://openalex.org/W3133440961","https://openalex.org/W3149627794","https://openalex.org/W3154147337","https://openalex.org/W3213358601","https://openalex.org/W4225001692","https://openalex.org/W4281673713","https://openalex.org/W4378195111","https://openalex.org/W4385723172","https://openalex.org/W6774526564","https://openalex.org/W6775319986","https://openalex.org/W6788194588","https://openalex.org/W6791397626","https://openalex.org/W6793818051","https://openalex.org/W6810122608","https://openalex.org/W6838679636","https://openalex.org/W6838992615"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W1568520348","https://openalex.org/W3214407891","https://openalex.org/W3194113117","https://openalex.org/W3213194066","https://openalex.org/W4287020359","https://openalex.org/W268355439","https://openalex.org/W2967125893","https://openalex.org/W4385323698","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Offensive":[0],"language":[1,29],"detection":[2],"has":[3],"been":[4],"well":[5],"studied":[6],"in":[7,15,31],"many":[8],"languages,":[9,17],"but":[10],"it":[11],"is":[12,71],"lagging":[13],"behind":[14],"low-resource":[16],"such":[18],"as":[19,68],"Hebrew.":[20,32],"In":[21],"this":[22],"paper,":[23],"we":[24],"present":[25],"a":[26],"new":[27],"offensive":[28],"corpus":[30],"A":[33],"total":[34],"of":[35,49,87],"15,881":[36],"tweets":[37],"were":[38],"retrieved":[39],"from":[40],"Twitter.":[41],"Each":[42],"was":[43,66],"labeled":[44],"with":[45,76,119],"one":[46],"or":[47,56],"more":[48],"five":[50],"classes":[51],"(abusive,":[52],"hate,":[53],"violence,":[54],"pornographic,":[55],"none":[57],"offensive)":[58],"by":[59,115],"Arabic-Hebrew":[60],"bilingual":[61],"speakers.":[62],"The":[63],"annotation":[64],"process":[65],"challenging":[67],"each":[69,88],"annotator":[70],"expected":[72],"to":[73,83,156],"be":[74,153],"familiar":[75],"the":[77,85,157],"Israeli":[78],"culture,":[79],"politics,":[80],"and":[81,97,103,128,143,164,171],"practices":[82],"understand":[84],"context":[86],"tweet.":[89],"We":[90,107],"fine-tuned":[91,165],"two":[92],"Hebrew":[93],"BERT":[94],"models,":[95],"HeBERT":[96,113],"AlephBERT,":[98],"using":[99],"our":[100,110,126,146,159],"proposed":[101],"dataset":[102,163],"another":[104],"published":[105],"dataset.":[106],"observed":[108],"that":[109],"data":[111,127,147,160],"boosts":[112],"performance":[114],"2%":[116],"when":[117],"combined":[118],"D<inf":[120,131,140],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[121,132,141],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">OLaH</inf>.":[122],"Fine-tuning":[123],"AlephBERT":[124],"on":[125,130,139,145,169],"testing":[129,144],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">OLaH</inf>":[133,142],"yields":[134,148],"69%":[135],"accuracy,":[136,150],"while":[137],"fine-tuning":[138],"57%":[149],"which":[151],"may":[152],"an":[154],"indication":[155],"generalizability":[158],"offers.":[161],"Our":[162],"models":[166],"are":[167],"available":[168],"GitHub":[170],"Huggingface.":[172]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-24T08:23:43.765630","created_date":"2025-10-10T00:00:00"}
