{"id":"https://openalex.org/W7128525443","doi":"https://doi.org/10.48550/arxiv.2602.07639","title":"Letting Tutor Personas \"Speak Up\" for LLMs: Learning Steering Vectors from Dialogue via Preference Optimization","display_name":"Letting Tutor Personas \"Speak Up\" for LLMs: Learning Steering Vectors from Dialogue via Preference Optimization","publication_year":2026,"publication_date":"2026-02-07","ids":{"openalex":"https://openalex.org/W7128525443","doi":"https://doi.org/10.48550/arxiv.2602.07639"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.07639","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125517153","display_name":"Jaewook Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lee, Jaewook","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008589669","display_name":"Alexander Scarlatos","orcid":"https://orcid.org/0000-0001-6419-5909"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scarlatos, Alexander","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034068210","display_name":"Simon Woodhead","orcid":"https://orcid.org/0000-0002-2192-9797"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Woodhead, Simon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5122324618","display_name":"Andrew Lan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lan, Andrew","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5125517153"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.44369998574256897,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.44369998574256897,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.07930000126361847,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.06549999862909317,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tutor","display_name":"TUTOR","score":0.8233000040054321},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.7156000137329102},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.6579999923706055},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5911999940872192},{"id":"https://openalex.org/keywords/persona","display_name":"Persona","score":0.569599986076355},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.47440001368522644}],"concepts":[{"id":"https://openalex.org/C2778371403","wikidata":"https://www.wikidata.org/wiki/Q7672049","display_name":"TUTOR","level":2,"score":0.8233000040054321},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.7156000137329102},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6643000245094299},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.6579999923706055},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5911999940872192},{"id":"https://openalex.org/C313442","wikidata":"https://www.wikidata.org/wiki/Q778556","display_name":"Persona","level":2,"score":0.569599986076355},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5273000001907349},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4945000112056732},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.4675999879837036},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3395000100135803},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3009999990463257},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.29919999837875366},{"id":"https://openalex.org/C179748633","wikidata":"https://www.wikidata.org/wiki/Q7160411","display_name":"Peer tutor","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.28060001134872437},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.26190000772476196}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.07639","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.07639","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.07639","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.07639","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7989947199821472,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,40,60,163],"emergence":[2],"of":[3,12,42,62,162],"large":[4],"language":[5],"models":[6],"(LLMs)":[7],"as":[8],"a":[9,32,119],"powerful":[10],"class":[11],"generative":[13],"artificial":[14],"intelligence":[15],"(AI),":[16],"their":[17],"use":[18],"in":[19,70,94,177,196],"tutoring":[20,29,43,178],"has":[21],"become":[22],"increasingly":[23],"prominent.":[24],"Prior":[25],"works":[26],"on":[27,107],"LLM-based":[28],"typically":[30],"learn":[31,118],"single":[33],"tutor":[34,91,131,150],"policy":[35],"and":[36,67,82,152,189],"do":[37],"not":[38],"capture":[39],"diversity":[41],"styles.":[44],"In":[45,85],"real-world":[46],"tutor-student":[47,96],"interactions,":[48],"pedagogical":[49],"intent":[50],"is":[51],"realized":[52],"through":[53],"adaptive":[54],"instructional":[55,64],"strategies,":[56],"with":[57,148],"tutors":[58],"varying":[59],"level":[61],"scaffolding,":[63],"directiveness,":[65],"feedback,":[66],"affective":[68],"support":[69],"response":[71],"to":[72,101,117,174],"learners'":[73],"needs.":[74],"These":[75,180],"differences":[76,176],"can":[77,98],"all":[78],"impact":[79],"dialogue":[80,143,204],"dynamics":[81],"student":[83],"engagement.":[84],"this":[86,136],"paper,":[87],"we":[88],"explore":[89],"how":[90],"personas":[92],"embedded":[93],"human":[95,203],"dialogues":[97],"be":[99],"used":[100],"guide":[102],"LLM":[103],"behavior":[104],"without":[105],"relying":[106],"explicitly":[108],"prompted":[109],"instructions.":[110],"We":[111,133],"modify":[112],"Bidirectional":[113],"Preference":[114],"Optimization":[115],"(BiPO)":[116],"steering":[120,137,185],"vector,":[121],"an":[122,187],"activation-space":[123],"direction":[124],"that":[125,135,183],"steers":[126],"model":[127],"responses":[128],"towards":[129],"certain":[130],"personas.":[132],"find":[134],"vector":[138],"captures":[139],"tutor-specific":[140,194],"variation":[141,195],"across":[142,171],"contexts,":[144],"improving":[145],"semantic":[146],"alignment":[147],"ground-truth":[149],"utterances":[151],"increasing":[153],"preference-based":[154],"evaluations,":[155],"while":[156],"largely":[157],"preserving":[158],"lexical":[159],"similarity.":[160],"Analysis":[161],"learned":[164],"directional":[165],"coefficients":[166],"further":[167],"reveals":[168],"interpretable":[169,190],"structure":[170],"tutors,":[172],"corresponding":[173],"consistent":[175],"behavior.":[179],"results":[181],"demonstrate":[182],"activation":[184],"offers":[186],"effective":[188],"way":[191],"for":[192],"controlling":[193],"LLMs":[197],"using":[198],"signals":[199],"derived":[200],"directly":[201],"from":[202],"data.":[205]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-11T00:00:00"}
