{"id":"https://openalex.org/W7161742693","doi":"https://doi.org/10.48550/arxiv.2605.16996","title":"Evaluation Drift in LLM Personality Induction: Are We Moving the Goalpost?","display_name":"Evaluation Drift in LLM Personality Induction: Are We Moving the Goalpost?","publication_year":2026,"publication_date":"2026-05-16","ids":{"openalex":"https://openalex.org/W7161742693","doi":"https://doi.org/10.48550/arxiv.2605.16996"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.16996","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16996","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.16996","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058606449","display_name":"Prateek Rajput","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rajput, Prateek","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136466448","display_name":"Yewei Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yewei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136454878","display_name":"Iyiola E. Olatunji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Olatunji, Iyiola E.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136457689","display_name":"Jacques Klein","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klein, Jacques","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136488003","display_name":"Tegawend\u00e9 F. Bissyand\u00e9","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bissyand\u00e9, Tegawend\u00e9 F.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11040","display_name":"Personality Traits and Psychology","score":0.44780001044273376,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11040","display_name":"Personality Traits and Psychology","score":0.44780001044273376,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.12370000034570694,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.09099999815225601,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/personality","display_name":"Personality","score":0.8126000165939331},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5885000228881836},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.5480999946594238},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4900999963283539},{"id":"https://openalex.org/keywords/big-five-personality-traits","display_name":"Big Five personality traits","score":0.4683000147342682},{"id":"https://openalex.org/keywords/affect","display_name":"Affect (linguistics)","score":0.3741999864578247}],"concepts":[{"id":"https://openalex.org/C187288502","wikidata":"https://www.wikidata.org/wiki/Q641118","display_name":"Personality","level":2,"score":0.8126000165939331},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.6449999809265137},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5885000228881836},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.5715000033378601},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.5480999946594238},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.4999000132083893},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4900999963283539},{"id":"https://openalex.org/C2865642","wikidata":"https://www.wikidata.org/wiki/Q378132","display_name":"Big Five personality traits","level":3,"score":0.4683000147342682},{"id":"https://openalex.org/C2776035688","wikidata":"https://www.wikidata.org/wiki/Q1606558","display_name":"Affect (linguistics)","level":2,"score":0.3741999864578247},{"id":"https://openalex.org/C75630572","wikidata":"https://www.wikidata.org/wiki/Q538904","display_name":"Applied psychology","level":1,"score":0.33390000462532043},{"id":"https://openalex.org/C174010058","wikidata":"https://www.wikidata.org/wiki/Q7170643","display_name":"Personality Assessment Inventory","level":3,"score":0.3172999918460846},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2928999960422516},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2815000116825104},{"id":"https://openalex.org/C138496976","wikidata":"https://www.wikidata.org/wiki/Q175002","display_name":"Developmental psychology","level":1,"score":0.2662000060081482},{"id":"https://openalex.org/C111370547","wikidata":"https://www.wikidata.org/wiki/Q7451120","display_name":"Sensory cue","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C80191262","wikidata":"https://www.wikidata.org/wiki/Q5477668","display_name":"Fragility","level":2,"score":0.2565000057220459}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.16996","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16996","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.16996","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16996","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4960407018661499,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Can":[0],"large":[1],"language":[2],"models":[3],"reliably":[4],"express":[5],"a":[6,17,42,118],"human-like":[7],"personality,":[8],"or":[9,155],"are":[10],"they":[11],"merely":[12],"mimicking":[13],"surface":[14],"cues":[15,143],"without":[16],"stable":[18],"underlying":[19],"profile?":[20],"To":[21],"investigate":[22],"this,":[23],"we":[24,64],"induce":[25,82],"personality":[26,46,58,147],"in":[27,98,110],"LLMs":[28],"by":[29],"fine-tuning":[30,94],"them":[31],"on":[32,123],"the":[33,51,56,60,106,124,142],"long-form":[34],"essays,":[35],"where":[36],"each":[37],"essay":[38],"is":[39],"associated":[40],"with":[41],"target":[43,83],"Big":[44,84],"Five":[45,85],"profile.":[47],"We":[48,149],"then":[49],"evaluate":[50],"stability":[52,116],"and":[53,78],"fidelity":[54],"of":[55],"induced":[57],"using":[59],"IPIP-NEO":[61],"questionnaire.":[62],"Specifically,":[63],"ask:":[65],"(i)":[66],"does":[67],"post-training":[68],"(SFT,":[69],"DPO,":[70],"ORPO)":[71],"stabilize":[72],"questionnaire":[73,99],"scores":[74,134],"under":[75],"prompt":[76],"rephrasings,":[77],"(ii)":[79],"can":[80],"it":[81],"profiles":[86],"from":[87],"unguided":[88,139],"essays?":[89],"Our":[90],"results":[91],"demonstrate":[92],"that":[93,138,158],"consistently":[95],"reduces":[96],"variance":[97],"responses":[100],"across":[101],"five":[102],"models,":[103],"directly":[104],"mitigating":[105],"evaluation":[107],"fragility":[108],"reported":[109],"pre-trained":[111],"models.":[112],"However,":[113],"this":[114],"newfound":[115],"reveals":[117],"more":[119],"fundamental":[120],"limitation:":[121],"accuracy":[122],"full":[125],"five-dimensional":[126],"profile":[127],"remains":[128],"near":[129],"chance,":[130],"even":[131],"when":[132],"single-trait":[133],"improve.":[135],"This":[136],"indicates":[137],"essays":[140],"lack":[141],"needed":[144],"for":[145,152],"faithful":[146],"expression.":[148],"therefore":[150],"argue":[151],"scenario-grounded":[153],"datasets":[154],"interactive":[156],"elicitation":[157],"accumulates":[159],"test-aligned":[160],"evidence":[161],"over":[162],"time.":[163]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
