{"id":"https://openalex.org/W7153002337","doi":"https://doi.org/10.48550/arxiv.2604.07729","title":"Emotion Concepts and their Function in a Large Language Model","display_name":"Emotion Concepts and their Function in a Large Language Model","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W7153002337","doi":"https://doi.org/10.48550/arxiv.2604.07729"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07729","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014438127","display_name":"Nicholas Sofroniew","orcid":"https://orcid.org/0000-0002-3426-0914"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sofroniew, Nicholas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076848733","display_name":"Isaac Kauvar","orcid":"https://orcid.org/0000-0002-1336-0721"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kauvar, Isaac","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133324927","display_name":"William Saunders","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saunders, William","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021606299","display_name":"Runjin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Runjin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110225167","display_name":"Tom Henighan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Henighan, Tom","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133350700","display_name":"Sasha Hydrie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hydrie, Sasha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133373795","display_name":"Craig Citro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Citro, Craig","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133343568","display_name":"Adam Pearce","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pearce, Adam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122414842","display_name":"Julius Tarng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tarng, Julius","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036313350","display_name":"Wes Gurnee","orcid":"https://orcid.org/0000-0002-0752-3934"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gurnee, Wes","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029631340","display_name":"Joshua Batson","orcid":"https://orcid.org/0000-0002-9244-2142"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Batson, Joshua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133354032","display_name":"Sam Zimmerman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zimmerman, Sam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133363102","display_name":"Kelley Rivoire","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rivoire, Kelley","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123209938","display_name":"Kyle Fish","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fish, Kyle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039751155","display_name":"Chris Olah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Olah, Chris","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5006832724","display_name":"Jack Lindsey","orcid":"https://orcid.org/0000-0003-0930-7327"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lindsey, Jack","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5014438127"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.2809999883174896,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.2809999883174896,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.10980000346899033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.09910000115633011,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.592199981212616},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.592199981212616},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.5921000242233276},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5289000272750854},{"id":"https://openalex.org/keywords/phenomenon","display_name":"Phenomenon","score":0.5113000273704529},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.3898000121116638},{"id":"https://openalex.org/keywords/human-language","display_name":"Human language","score":0.34380000829696655},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3264000117778778}],"concepts":[{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.6187000274658203},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.6082000136375427},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.592199981212616},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.592199981212616},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.5921000242233276},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5289000272750854},{"id":"https://openalex.org/C50335755","wikidata":"https://www.wikidata.org/wiki/Q483247","display_name":"Phenomenon","level":2,"score":0.5113000273704529},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.3898000121116638},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.36469998955726624},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3499000072479248},{"id":"https://openalex.org/C2993724205","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Human language","level":2,"score":0.34380000829696655},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C128534915","wikidata":"https://www.wikidata.org/wiki/Q3475770","display_name":"Affective science","level":3,"score":0.3028999865055084},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.28940001130104065},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.2815000116825104},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C2777601897","wikidata":"https://www.wikidata.org/wiki/Q3409113","display_name":"Presentation (obstetrics)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.25999999046325684},{"id":"https://openalex.org/C168862018","wikidata":"https://www.wikidata.org/wiki/Q5373805","display_name":"Emotionality","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07729","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07729","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.525890052318573,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"sometimes":[4],"appear":[5,171],"to":[6,76,116,172],"exhibit":[7],"emotional":[8],"reactions.":[9],"We":[10,27,114],"investigate":[11],"why":[12],"this":[13,117],"is":[14,88],"the":[15,36,57,78,94,120,134,177],"case":[16],"in":[17,66,70],"Claude":[18],"Sonnet":[19],"4.5":[20],"and":[21,43,47,81,100,112,128,158],"explore":[22],"implications":[23],"for":[24,175],"alignment-relevant":[25],"behavior.":[26,179],"find":[28],"internal":[29],"representations":[30,55,91,145],"of":[31,39,103,126,136,146,168],"emotion":[32,42,59,147],"concepts,":[33],"which":[34,139],"encode":[35],"broad":[37],"concept":[38,60],"a":[40,62,67],"particular":[41],"generalize":[44],"across":[45],"contexts":[46],"behaviors":[48,106],"it":[49],"might":[50],"be":[51,173],"linked":[52],"to.":[53],"These":[54],"track":[56],"operative":[58],"at":[61],"given":[63],"token":[64],"position":[65],"conversation,":[68],"activating":[69],"accordance":[71],"with":[72],"that":[73,89,162],"emotion's":[74],"relevance":[75],"processing":[77],"present":[79],"context":[80],"predicting":[82],"upcoming":[83],"text.":[84],"Our":[85],"key":[86],"finding":[87],"these":[90],"causally":[92],"influence":[93,135],"LLM's":[95],"outputs,":[96],"including":[97],"Claude's":[98],"preferences":[99],"its":[101],"rate":[102],"exhibiting":[104,122],"misaligned":[105],"such":[107],"as":[108,119],"reward":[109],"hacking,":[110],"blackmail,":[111],"sycophancy.":[113],"refer":[115],"phenomenon":[118],"LLM":[121],"functional":[123],"emotions:":[124],"patterns":[125],"expression":[127],"behavior":[129],"modeled":[130],"after":[131],"humans":[132],"under":[133],"an":[137],"emotion,":[138],"are":[140],"mediated":[141],"by":[142],"underlying":[143],"abstract":[144],"concepts.":[148],"Functional":[149],"emotions":[150],"may":[151],"work":[152],"quite":[153],"differently":[154],"from":[155],"human":[156],"emotions,":[157,169],"do":[159],"not":[160],"imply":[161],"LLMs":[163],"have":[164],"any":[165],"subjective":[166],"experience":[167],"but":[170],"important":[174],"understanding":[176],"model's":[178]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-05-27T09:02:27.158192","created_date":"2026-04-11T00:00:00"}
