{"id":"https://openalex.org/W7116864210","doi":"https://doi.org/10.48550/arxiv.2512.17639","title":"Linear Personality Probing and Steering in LLMs: A Big Five Study","display_name":"Linear Personality Probing and Steering in LLMs: A Big Five Study","publication_year":2025,"publication_date":"2025-12-19","ids":{"openalex":"https://openalex.org/W7116864210","doi":"https://doi.org/10.48550/arxiv.2512.17639"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.17639","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17639","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.17639","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017326060","display_name":"Michel Frising","orcid":"https://orcid.org/0000-0003-3725-4824"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Frising, Michel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121067474","display_name":"Daniel Balcells","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balcells, Daniel","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5017326060"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11040","display_name":"Personality Traits and Psychology","score":0.8575000166893005,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11040","display_name":"Personality Traits and Psychology","score":0.8575000166893005,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.0272000003606081,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11519","display_name":"Digital Mental Health Interventions","score":0.00839999970048666,"subfield":{"id":"https://openalex.org/subfields/3202","display_name":"Applied Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/personality","display_name":"Personality","score":0.7139000296592712},{"id":"https://openalex.org/keywords/personality-psychology","display_name":"Personality psychology","score":0.6119999885559082},{"id":"https://openalex.org/keywords/big-five-personality-traits","display_name":"Big Five personality traits","score":0.6017000079154968},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5879999995231628},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.5698000192642212},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5572999715805054},{"id":"https://openalex.org/keywords/trait","display_name":"Trait","score":0.5282999873161316}],"concepts":[{"id":"https://openalex.org/C187288502","wikidata":"https://www.wikidata.org/wiki/Q641118","display_name":"Personality","level":2,"score":0.7139000296592712},{"id":"https://openalex.org/C25908422","wikidata":"https://www.wikidata.org/wiki/Q271716","display_name":"Personality psychology","level":3,"score":0.6119999885559082},{"id":"https://openalex.org/C2865642","wikidata":"https://www.wikidata.org/wiki/Q378132","display_name":"Big Five personality traits","level":3,"score":0.6017000079154968},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5879999995231628},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.5698000192642212},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5572999715805054},{"id":"https://openalex.org/C106934330","wikidata":"https://www.wikidata.org/wiki/Q1971873","display_name":"Trait","level":2,"score":0.5282999873161316},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4221000075340271},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.41510000824928284},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4115999937057495},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.3873000144958496},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35899999737739563},{"id":"https://openalex.org/C3020318244","wikidata":"https://www.wikidata.org/wiki/Q4812187","display_name":"Large sample","level":2,"score":0.3190999925136566},{"id":"https://openalex.org/C3019152653","wikidata":"https://www.wikidata.org/wiki/Q186290","display_name":"Linear relationship","level":2,"score":0.30149999260902405},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.27970001101493835},{"id":"https://openalex.org/C24663603","wikidata":"https://www.wikidata.org/wiki/Q2428138","display_name":"16PF Questionnaire","level":5,"score":0.27730000019073486},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.26840001344680786},{"id":"https://openalex.org/C134238545","wikidata":"https://www.wikidata.org/wiki/Q4736511","display_name":"Alternative five model of personality","level":5,"score":0.2653000056743622},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2599000036716461}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.17639","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17639","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.17639","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17639","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"exhibit":[4],"distinct":[5],"and":[6,13,28,43,54,77,92,106,140,146],"consistent":[7],"personalities":[8],"that":[9,18,118,153],"greatly":[10],"impact":[11],"trust":[12],"engagement.":[14],"While":[15],"this":[16,58],"means":[17],"personality":[19,70,121,163],"frameworks":[20],"would":[21],"be":[22,73],"highly":[23],"valuable":[24],"tools":[25],"to":[26,114],"characterize":[27],"control":[29],"LLMs'":[30],"behavior,":[31],"current":[32],"approaches":[33],"remain":[34],"either":[35],"costly":[36],"(post-training)":[37],"or":[38,185],"brittle":[39],"(prompt":[40],"engineering).":[41],"Probing":[42],"steering":[44,78,147,167],"via":[45],"linear":[46,63,128,154],"directions":[47,64,136,155],"has":[48],"recently":[49],"emerged":[50],"as":[51],"a":[52,132],"cheap":[53],"efficient":[55],"alternative.":[56],"In":[57],"paper,":[59],"we":[60,85,130],"investigate":[61],"whether":[62],"aligned":[65,156],"with":[66,103,157],"the":[67,101,109,192],"Big":[68,94],"Five":[69,95],"traits":[71,122],"can":[72],"used":[74],"for":[75,144,162],"probing":[76,145],"model":[79,102,148],"behavior.":[80,149],"Using":[81,127],"Llama":[82],"3.3":[83],"70B,":[84],"generate":[86],"descriptions":[87,105],"of":[88,134],"406":[89],"fictional":[90],"characters":[91],"their":[93,142,166],"trait":[96],"scores.":[97],"We":[98],"then":[99],"prompt":[100],"these":[104],"questions":[107],"from":[108],"Alpaca":[110],"questionnaire,":[111],"allowing":[112],"us":[113],"sample":[115],"hidden":[116],"activations":[117],"vary":[119],"along":[120],"in":[123,137,176,182,191],"known,":[124],"quantifiable":[125],"ways.":[126],"regression,":[129],"learn":[131],"set":[133],"per-layer":[135],"activation":[138],"space,":[139],"test":[141],"effectiveness":[143],"Our":[150],"results":[151],"suggest":[152],"trait-scores":[158],"are":[159],"effective":[160],"probes":[161],"detection,":[164],"while":[165],"capabilities":[168],"strongly":[169],"depend":[170],"on":[171],"context,":[172],"producing":[173],"reliable":[174],"effects":[175],"forced-choice":[177],"tasks":[178],"but":[179],"limited":[180],"influence":[181],"open-ended":[183],"generation":[184],"when":[186],"additional":[187],"context":[188],"is":[189],"present":[190],"prompt.":[193]},"counts_by_year":[],"updated_date":"2025-12-23T23:15:37.779995","created_date":"2025-12-23T00:00:00"}
