{"id":"https://openalex.org/W7138177845","doi":"https://doi.org/10.48550/arxiv.2603.13249","title":"Steering at the Source: Style Modulation Heads for Robust Persona Control","display_name":"Steering at the Source: Style Modulation Heads for Robust Persona Control","publication_year":2026,"publication_date":"2026-02-24","ids":{"openalex":"https://openalex.org/W7138177845","doi":"https://doi.org/10.48550/arxiv.2603.13249"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.13249","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13249","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.13249","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129672143","display_name":"Yoshihiro Izawa","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Izawa, Yoshihiro","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012454552","display_name":"Gouki Minegishi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Minegishi, Gouki","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108320347","display_name":"Koshi Eguchi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eguchi, Koshi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129681703","display_name":"Sosuke Hosokawa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hosokawa, Sosuke","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5009359355","display_name":"Kenjiro Taura","orcid":"https://orcid.org/0000-0001-5224-382X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taura, Kenjiro","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5129672143"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.4634000062942505,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.4634000062942505,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.045499999076128006,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.04039999842643738,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.5608999729156494},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5468999743461609},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5220000147819519},{"id":"https://openalex.org/keywords/degradation","display_name":"Degradation (telecommunications)","score":0.43689998984336853},{"id":"https://openalex.org/keywords/modulation","display_name":"Modulation (music)","score":0.39649999141693115},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.39149999618530273},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.38659998774528503},{"id":"https://openalex.org/keywords/persona","display_name":"Persona","score":0.3765000104904175}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.632099986076355},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.5608999729156494},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5468999743461609},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5220000147819519},{"id":"https://openalex.org/C2779679103","wikidata":"https://www.wikidata.org/wiki/Q5251805","display_name":"Degradation (telecommunications)","level":2,"score":0.43689998984336853},{"id":"https://openalex.org/C123079801","wikidata":"https://www.wikidata.org/wiki/Q750240","display_name":"Modulation (music)","level":2,"score":0.39649999141693115},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.38659998774528503},{"id":"https://openalex.org/C313442","wikidata":"https://www.wikidata.org/wiki/Q778556","display_name":"Persona","level":2,"score":0.3765000104904175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36980000138282776},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3562000095844269},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.35510000586509705},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3447999954223633},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3294000029563904},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3255000114440918},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.30649998784065247},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.29490000009536743},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.28369998931884766},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.2678000032901764},{"id":"https://openalex.org/C150594956","wikidata":"https://www.wikidata.org/wiki/Q1334829","display_name":"Wearable computer","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.13249","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13249","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.13249","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13249","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.5774791836738586,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Activation":[0],"steering":[1],"offers":[2],"a":[3,25,60],"computationally":[4],"efficient":[5],"mechanism":[6],"for":[7],"controlling":[8,17],"Large":[9],"Language":[10],"Models":[11],"(LLMs)":[12],"without":[13],"fine-tuning.":[14],"While":[15],"effectively":[16],"target":[18],"traits":[19],"(e.g.,":[20],"persona),":[21],"coherency":[22,119],"degradation":[23,37,120],"remains":[24],"major":[26],"obstacle":[27],"to":[28],"safety":[29],"and":[30,50,73,98,137],"practical":[31],"deployment.":[32],"We":[33,102],"hypothesize":[34],"that":[35,69,104,131],"this":[36,56],"stems":[38],"from":[39],"intervening":[40],"on":[41],"the":[42,118],"residual":[43,123],"stream,":[44],"which":[45,76],"indiscriminately":[46],"affects":[47],"aggregated":[48],"features":[49],"inadvertently":[51],"amplifies":[52],"off-target":[53],"noise.":[54],"In":[55],"work,":[57],"we":[58,77],"identify":[59],"sparse":[61],"subset":[62],"of":[63,91],"attention":[64],"heads":[65,84,110],"(only":[66],"three":[67],"heads)":[68],"independently":[70],"govern":[71],"persona":[72],"style":[74],"formation,":[75],"term":[78],"Style":[79],"Modulation":[80],"Heads.":[81],"Specifically,":[82],"these":[83,108],"can":[85],"be":[86],"localized":[87],"via":[88],"geometric":[89],"analysis":[90],"internal":[92],"representations,":[93],"combining":[94],"layer-wise":[95],"cosine":[96],"similarity":[97],"head-wise":[99],"contribution":[100],"scores.":[101],"demonstrate":[103],"intervention":[105],"targeting":[106],"only":[107],"specific":[109],"achieves":[111],"robust":[112],"behavioral":[113],"control":[114],"while":[115],"significantly":[116],"mitigating":[117],"observed":[121],"in":[122],"stream":[124],"steering.":[125],"More":[126],"broadly,":[127],"our":[128],"findings":[129],"show":[130],"precise,":[132],"component-level":[133],"localization":[134],"enables":[135],"safer":[136],"more":[138],"precise":[139],"model":[140],"control.":[141]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
