{"id":"https://openalex.org/W7154736432","doi":"https://doi.org/10.48550/arxiv.2604.14463","title":"Psychological Steering of Large Language Models","display_name":"Psychological Steering of Large Language Models","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154736432","doi":"https://doi.org/10.48550/arxiv.2604.14463"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14463","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14463","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14463","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133898760","display_name":"Leonardo Blas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Blas, Leonardo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133885567","display_name":"Robin Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Robin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133905999","display_name":"Emilio Ferrara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ferrara, Emilio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.3447999954223633,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.3447999954223633,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.1071000024676323,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08889999985694885,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6227999925613403},{"id":"https://openalex.org/keywords/trait","display_name":"Trait","score":0.47749999165534973},{"id":"https://openalex.org/keywords/personality","display_name":"Personality","score":0.4323999881744385},{"id":"https://openalex.org/keywords/covariance","display_name":"Covariance","score":0.41769999265670776},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4065999984741211},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.4049000144004822},{"id":"https://openalex.org/keywords/intervention","display_name":"Intervention (counseling)","score":0.38019999861717224}],"concepts":[{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6227999925613403},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5634999871253967},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5338000059127808},{"id":"https://openalex.org/C106934330","wikidata":"https://www.wikidata.org/wiki/Q1971873","display_name":"Trait","level":2,"score":0.47749999165534973},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.45719999074935913},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.43959999084472656},{"id":"https://openalex.org/C187288502","wikidata":"https://www.wikidata.org/wiki/Q641118","display_name":"Personality","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4255000054836273},{"id":"https://openalex.org/C178650346","wikidata":"https://www.wikidata.org/wiki/Q201984","display_name":"Covariance","level":2,"score":0.41769999265670776},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.4049000144004822},{"id":"https://openalex.org/C2780665704","wikidata":"https://www.wikidata.org/wiki/Q959298","display_name":"Intervention (counseling)","level":2,"score":0.38019999861717224},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3637000024318695},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.3425000011920929},{"id":"https://openalex.org/C2865642","wikidata":"https://www.wikidata.org/wiki/Q378132","display_name":"Big Five personality traits","level":3,"score":0.2825999855995178},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.25619998574256897},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14463","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14463","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14463","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14463","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.8662850260734558,"display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"emulate":[4],"a":[5,55,134,145,215],"consistent":[6],"human-like":[7],"behavior":[8],"that":[9,59,96,144,180,207],"can":[10],"be":[11],"shaped":[12],"through":[13],"activation-level":[14],"interventions.":[15],"This":[16],"paradigm":[17],"is":[18],"converging":[19],"on":[20,26],"additive":[21],"residual-stream":[22,73],"injections,":[23],"which":[24,83],"rely":[25],"injection-strength":[27],"sweeps":[28,63],"to":[29,89,122,167,172],"approximate":[30],"optimal":[31,49],"intervention":[32,50],"settings.":[33],"However,":[34],"existing":[35],"methods":[36,154],"restrict":[37],"the":[38,81,85,185,210],"search":[39],"space":[40],"and":[41,71,78,129,149,169,189,220],"sweep":[42],"in":[43,64,110,113,137,155],"uncalibrated":[44],"activation-space":[45],"units,":[46],"potentially":[47],"missing":[48],"conditions.":[51],"Thus,":[52],"we":[53,79,142,178],"introduce":[54],"psychological":[56,76,139,197],"steering":[57],"framework":[58],"performs":[60],"unbounded,":[61],"fluency-constrained":[62],"semantically":[65],"calibrated":[66],"units.":[67],"Our":[68],"method":[69],"derives":[70],"calibrates":[72],"injections":[74,99,151,182],"using":[75],"artifacts,":[77],"use":[80],"IPIP-NEO-120,":[82],"measures":[84],"OCEAN":[86,108,203],"personality":[87],"model,":[88,213],"compare":[90],"six":[91],"injection":[92],"methods.":[93],"We":[94],"find":[95,143],"mean-difference":[97],"(MD)":[98],"outperform":[100],"Personality":[101],"Prompting":[102],"(P$^2$),":[103],"an":[104],"established":[105],"baseline":[106],"for":[107,196],"steering,":[109],"open-ended":[111,138],"generation":[112],"11":[114],"of":[115,120,147,157],"14":[116,158],"LLMs,":[117,159],"with":[118,160,184],"gains":[119,161],"3.6\\%":[121],"16.4\\%,":[123],"overturning":[124],"prior":[125],"reports":[126],"favoring":[127],"prompting":[128],"positioning":[130],"representation":[131],"engineering":[132],"as":[133],"new":[135],"frontier":[136],"steering.":[140,198],"Further,":[141],"hybrid":[146],"P$^2$":[148,163],"MD":[150,175,181],"outperforms":[152],"both":[153],"13":[156],"over":[162,174],"ranging":[164],"from":[165,170,209],"5.6\\%":[166],"21.9\\%":[168],"3.3\\%":[171],"26.7\\%":[173],"injections.":[176],"Finally,":[177],"show":[179],"align":[183],"Linear":[186],"Representation":[187],"Hypothesis":[188],"provide":[190],"reliable,":[191],"approximately":[192],"linear":[193],"control":[194],"knobs":[195],"Nevertheless,":[199],"they":[200],"also":[201],"induce":[202],"trait":[204],"covariance":[205],"patterns":[206],"depart":[208],"Big":[211],"Two":[212],"suggesting":[214],"gap":[216],"between":[217],"learned":[218],"representations":[219],"human":[221],"psychology.":[222]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-18T00:00:00"}
