{"id":"https://openalex.org/W7155195780","doi":"https://doi.org/10.48550/arxiv.2604.18729","title":"Investigating Counterfactual Unfairness in LLMs towards Identities through Humor","display_name":"Investigating Counterfactual Unfairness in LLMs towards Identities through Humor","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W7155195780","doi":"https://doi.org/10.48550/arxiv.2604.18729"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18729","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080089655","display_name":"S.-H. Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Shubin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134300118","display_name":"Yejin Son","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Son, Yejin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026618714","display_name":"Junyeong Park","orcid":"https://orcid.org/0000-0001-5325-7588"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Junyeong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134282096","display_name":"Keummin Ka","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ka, Keummin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054161559","display_name":"Seungbeen Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Seungbeen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134217108","display_name":"Jaeyoung Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Jaeyoung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046714396","display_name":"Hyeju Jang","orcid":"https://orcid.org/0000-0002-7652-1158"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jang, Hyeju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134288450","display_name":"Alice Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oh, Alice","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101881857","display_name":"Youngjae Yu","orcid":"https://orcid.org/0000-0002-5867-0782"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Youngjae","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11795","display_name":"Humor Studies and Applications","score":0.979200005531311,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11795","display_name":"Humor Studies and Applications","score":0.979200005531311,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.0038999998942017555,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.0012000000569969416,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.8125},{"id":"https://openalex.org/keywords/harm","display_name":"Harm","score":0.6707000136375427},{"id":"https://openalex.org/keywords/social-identity-theory","display_name":"Social identity theory","score":0.4875999987125397},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4546000063419342},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.4074000120162964},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.3643999993801117},{"id":"https://openalex.org/keywords/social-relation","display_name":"Social relation","score":0.34060001373291016}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.8125},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.7160999774932861},{"id":"https://openalex.org/C2777363581","wikidata":"https://www.wikidata.org/wiki/Q15098235","display_name":"Harm","level":2,"score":0.6707000136375427},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.6682000160217285},{"id":"https://openalex.org/C98447023","wikidata":"https://www.wikidata.org/wiki/Q1540351","display_name":"Social identity theory","level":3,"score":0.4875999987125397},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4546000063419342},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.4074000120162964},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.3643999993801117},{"id":"https://openalex.org/C130064352","wikidata":"https://www.wikidata.org/wiki/Q853725","display_name":"Social relation","level":2,"score":0.34060001373291016},{"id":"https://openalex.org/C131158328","wikidata":"https://www.wikidata.org/wiki/Q1307337","display_name":"Social influence","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C99821215","wikidata":"https://www.wikidata.org/wiki/Q1136583","display_name":"Swap (finance)","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C86658582","wikidata":"https://www.wikidata.org/wiki/Q1432778","display_name":"Social cognition","level":3,"score":0.28870001435279846},{"id":"https://openalex.org/C164850336","wikidata":"https://www.wikidata.org/wiki/Q3685487","display_name":"Interpersonal communication","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2694000005722046},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C187206662","wikidata":"https://www.wikidata.org/wiki/Q55607920","display_name":"Social dilemma","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C192562157","wikidata":"https://www.wikidata.org/wiki/Q316694","display_name":"Rhetorical question","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C91034043","wikidata":"https://www.wikidata.org/wiki/Q223642","display_name":"Interpersonal relationship","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.5055047869682312,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Humor":[0],"holds":[1],"up":[2,120,133],"a":[3,142],"mirror":[4],"to":[5,121,134],"social":[6,32,139],"perception:":[7],"what":[8],"we":[9,15,19,43,57],"find":[10],"funny":[11],"often":[12],"reflects":[13],"who":[14,59,62],"are":[16,118],"and":[17,61,81,89,131,150,160],"how":[18,51,148],"judge":[20],"others.":[21],"When":[22],"language":[23],"models":[24,108],"engage":[25],"with":[26],"humor,":[27],"their":[28],"reactions":[29],"expose":[30],"the":[31,52],"assumptions":[33],"they":[34],"have":[35],"internalized":[36],"from":[37],"training":[38],"data.":[39],"In":[40],"this":[41],"paper,":[42],"investigate":[44],"counterfactual":[45],"unfairness":[46],"through":[47],"humor":[48,75,88],"by":[49,115],"observing":[50],"model's":[53],"responses":[54],"change":[55],"when":[56],"swap":[58],"speaks":[60],"is":[63],"addressed":[64],"while":[65],"holding":[66],"other":[67],"factors":[68],"constant.":[69],"Our":[70],"framework":[71],"spans":[72],"three":[73],"tasks:":[74],"generation":[76],"refusal,":[77],"speaker":[78],"intention":[79],"inference,":[80],"relational/societal":[82],"impact":[83],"prediction,":[84],"covering":[85],"both":[86],"identity-agnostic":[87],"identity-specific":[90],"disparagement":[91],"humor.":[92],"We":[93],"introduce":[94],"interpretable":[95],"bias":[96],"metrics":[97],"that":[98],"capture":[99],"asymmetric":[100],"patterns":[101,146],"under":[102],"identity":[103],"swaps.":[104],"Experiments":[105],"across":[106],"state-of-the-art":[107],"reveal":[109],"consistent":[110],"relational":[111],"disparities:":[112],"jokes":[113],"told":[114],"privileged":[116],"speakers":[117],"refused":[119],"67.5%":[122],"more":[123,129],"often,":[124],"judged":[125],"as":[126],"malicious":[127],"64.7%":[128],"frequently,":[130],"rated":[132],"1.5":[135],"points":[136],"higher":[137],"in":[138,153],"harm":[140],"on":[141],"5-point":[143],"scale.":[144],"These":[145],"highlight":[147],"sensitivity":[149],"stereotyping":[151],"coexist":[152],"generative":[154],"models,":[155],"complicating":[156],"efforts":[157],"toward":[158],"fairness":[159],"cultural":[161],"alignment.":[162]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
