{"id":"https://openalex.org/W7140214165","doi":"https://doi.org/10.48550/arxiv.2603.21298","title":"More Than Sum of Its Parts: Deciphering Intent Shifts in Multimodal Hate Speech Detection","display_name":"More Than Sum of Its Parts: Deciphering Intent Shifts in Multimodal Hate Speech Detection","publication_year":2026,"publication_date":"2026-03-22","ids":{"openalex":"https://openalex.org/W7140214165","doi":"https://doi.org/10.48550/arxiv.2603.21298"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21298","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21298","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21298","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Sun, Runze","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sun, Runze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zheng, Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Xiong, Zexuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Zexuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Qu, Zhongjin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Zhongjin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Chen, Lei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhou, Jie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Lu, Jiwen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Jiwen","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.0017000000225380063,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decipher","display_name":"DECIPHER","score":0.6844000220298767},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5597000122070312},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.5088000297546387},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4810999929904938},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.42989999055862427},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.37220001220703125},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.35440000891685486},{"id":"https://openalex.org/keywords/suspect","display_name":"Suspect","score":0.3343999981880188}],"concepts":[{"id":"https://openalex.org/C164614171","wikidata":"https://www.wikidata.org/wiki/Q5204775","display_name":"DECIPHER","level":2,"score":0.6844000220298767},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6807000041007996},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5597000122070312},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.5088000297546387},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4810999929904938},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.42989999055862427},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3763999938964844},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.37220001220703125},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.35440000891685486},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3528999984264374},{"id":"https://openalex.org/C2778223634","wikidata":"https://www.wikidata.org/wiki/Q224952","display_name":"Suspect","level":2,"score":0.3343999981880188},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3165000081062317},{"id":"https://openalex.org/C2776372474","wikidata":"https://www.wikidata.org/wiki/Q508291","display_name":"Simplicity","level":2,"score":0.3156000077724457},{"id":"https://openalex.org/C59577422","wikidata":"https://www.wikidata.org/wiki/Q10265143","display_name":"False accusation","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C130440534","wikidata":"https://www.wikidata.org/wiki/Q14946528","display_name":"Conflation","level":2,"score":0.3091999888420105},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.2694000005722046},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2615000009536743}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21298","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21298","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21298","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21298","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8134792447090149,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Combating":[0],"hate":[1,25,88],"speech":[2,26],"on":[3,14,48,117,183,194],"social":[4],"media":[5],"is":[6,27],"critical":[7],"for":[8,157,186],"securing":[9],"cyberspace,":[10],"yet":[11],"relies":[12],"heavily":[13],"the":[15,59,63,105,113,118,139,163],"efficacy":[16],"of":[17,65,121],"automated":[18],"detection":[19],"systems.":[20],"As":[21],"content":[22,57],"formats":[23],"evolve,":[24],"transitioning":[28],"from":[29,89],"solely":[30],"plain":[31],"text":[32],"to":[33,41,77,85,165],"complex":[34,134],"multimodal":[35,56],"expressions,":[36],"making":[37],"implicit":[38,87,188],"attacks":[39],"harder":[40],"spot.":[42],"Current":[43],"systems,":[44],"however,":[45],"often":[46],"falter":[47],"these":[49,133],"subtle":[50],"cases,":[51,189],"as":[52],"they":[53],"struggle":[54],"with":[55],"where":[58,82,112,153],"emergent":[60],"meaning":[61],"transcends":[62],"aggregation":[64],"individual":[66],"modalities.":[67],"To":[68,130],"bridge":[69],"this":[70,100],"gap,":[71],"we":[72,103,136],"move":[73],"beyond":[74],"binary":[75],"classification":[76],"characterize":[78],"semantic":[79,96,168],"intent":[80,115],"shifts":[81],"modalities":[83,122],"interact":[84],"construct":[86],"benign":[90],"cues":[91,169],"or":[92,127],"neutralize":[93],"toxicity":[94],"through":[95],"inversion.":[97],"Guided":[98],"by":[99],"fine-grained":[101],"formulation,":[102],"curate":[104],"Hate":[106],"via":[107,142],"Vision-Language":[108],"Interplay":[109],"(H-VLI)":[110],"benchmark":[111],"true":[114],"hinges":[116],"intricate":[119],"interplay":[120],"rather":[123],"than":[124],"overt":[125],"visual":[126],"textual":[128],"slurs.":[129],"effectively":[131],"decipher":[132],"cues,":[135],"further":[137],"propose":[138],"Asymmetric":[140],"Reasoning":[141],"Courtroom":[143],"Agent":[144],"DEbate":[145],"(ARCADE)":[146],"framework.":[147],"By":[148],"simulating":[149],"a":[150,172],"judicial":[151],"process":[152],"agents":[154],"actively":[155],"argue":[156],"accusation":[158],"and":[159,199],"defense,":[160],"ARCADE":[161,178],"forces":[162],"model":[164],"scrutinize":[166],"deep":[167],"before":[170],"reaching":[171],"verdict.":[173],"Extensive":[174],"experiments":[175],"demonstrate":[176],"that":[177],"significantly":[179],"outperforms":[180],"state-of-the-art":[181],"baselines":[182],"H-VLI,":[184],"particularly":[185],"challenging":[187],"while":[190],"maintaining":[191],"competitive":[192],"performance":[193],"established":[195],"benchmarks.":[196],"Our":[197],"code":[198],"data":[200],"are":[201],"available":[202],"at:":[203],"https://github.com/Sayur1n/H-VLI":[204]},"counts_by_year":[],"updated_date":"2026-04-22T06:01:30.510260","created_date":"2026-03-25T00:00:00"}
