{"id":"https://openalex.org/W7152639304","doi":"https://doi.org/10.48550/arxiv.2604.06377","title":"The Master Key Hypothesis: Unlocking Cross-Model Capability Transfer via Linear Subspace Alignment","display_name":"The Master Key Hypothesis: Unlocking Cross-Model Capability Transfer via Linear Subspace Alignment","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7152639304","doi":"https://doi.org/10.48550/arxiv.2604.06377"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.06377","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06377","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.06377","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088070887","display_name":"Rishab Balasubramanian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Balasubramanian, Rishab","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133304326","display_name":"Pin-Jie Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Pin-Jie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128077487","display_name":"Rituraj Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Rituraj","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049221759","display_name":"Anjie Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Anjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133276194","display_name":"Fardin Abdi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abdi, Fardin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091009689","display_name":"Viktor Rozgi\u0107","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rozgic, Viktor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066223118","display_name":"Zheng Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Zheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133310665","display_name":"Mohit Bansal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bansal, Mohit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133243990","display_name":"Tu Vu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vu, Tu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.12129999697208405,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.12129999697208405,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.09019999951124191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0868000015616417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6503999829292297},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6290000081062317},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6194999814033508},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5685999989509583},{"id":"https://openalex.org/keywords/sharpening","display_name":"Sharpening","score":0.5644999742507935},{"id":"https://openalex.org/keywords/linear-model","display_name":"Linear model","score":0.3993000090122223},{"id":"https://openalex.org/keywords/latent-variable","display_name":"Latent variable","score":0.37229999899864197}],"concepts":[{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6503999829292297},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6312999725341797},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6290000081062317},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6194999814033508},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5685999989509583},{"id":"https://openalex.org/C2781137444","wikidata":"https://www.wikidata.org/wiki/Q237105","display_name":"Sharpening","level":2,"score":0.5644999742507935},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4153999984264374},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.3993000090122223},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.3328000009059906},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3312999904155731},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30320000648498535},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C6802819","wikidata":"https://www.wikidata.org/wiki/Q1072174","display_name":"Linear system","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C57489055","wikidata":"https://www.wikidata.org/wiki/Q190046","display_name":"Ellipsoid","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.2583000063896179},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.25699999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.06377","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06377","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.06377","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06377","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,21],"investigate":[1],"whether":[2],"post-trained":[3,159],"capabilities":[4,31,172,182],"can":[5],"be":[6],"transferred":[7],"across":[8,17,47,112],"models":[9,48],"without":[10,115],"retraining,":[11],"with":[12,80],"a":[13,36,59,66,81,85,136],"focus":[14],"on":[15,53,100,132,170],"transfer":[16,168],"different":[18],"model":[19,30,83,113],"scales.":[20],"propose":[22],"the":[23,97,153,157,165,171,185],"Master":[24],"Key":[25],"Hypothesis,":[26],"which":[27],"states":[28],"that":[29,40,64,164,177],"correspond":[32],"to":[33,95,124,142,150],"directions":[34],"in":[35],"low-dimensional":[37],"latent":[38,181],"subspace":[39],"induce":[41],"specific":[42],"behaviors":[43],"and":[44,61,74,89,106,134,176],"are":[45],"transferable":[46],"through":[49,84],"linear":[50,87],"alignment.":[51],"Based":[52],"this":[54],"hypothesis,":[55],"we":[56],"introduce":[57],"UNLOCK,":[58],"training-free":[60],"label-free":[62],"framework":[63],"extracts":[65],"capability":[67],"direction":[68,139],"by":[69,156,183],"contrasting":[70],"activations":[71],"between":[72],"capability-present":[73],"capability-absent":[75],"Source":[76],"variants,":[77],"aligns":[78],"it":[79,91],"Target":[82],"low-rank":[86],"transformation,":[88],"applies":[90],"at":[92],"inference":[93],"time":[94],"elicit":[96],"behavior.":[98],"Experiments":[99],"reasoning":[101,121,138,190],"behaviors,":[102],"including":[103],"Chain-of-Thought":[104],"(CoT)":[105],"mathematical":[107,137],"reasoning,":[108],"demonstrate":[109],"substantial":[110],"improvements":[111],"scales":[114],"training.":[116],"For":[117],"example,":[118],"transferring":[119,135],"CoT":[120],"from":[122,140,148],"Qwen1.5-14B":[123],"Qwen1.5-7B":[125],"yields":[126],"an":[127],"accuracy":[128,147],"gain":[129],"of":[130,167],"12.1%":[131],"MATH,":[133],"Qwen3-4B-Base":[141],"Qwen3-14B-Base":[143],"improves":[144],"AGIEval":[145],"Math":[146],"61.1%":[149],"71.3%,":[151],"surpassing":[152],"67.8%":[154],"achieved":[155],"14B":[158],"model.":[160],"Our":[161],"analysis":[162],"shows":[163],"success":[166],"depends":[169],"learned":[173],"during":[174],"pre-training,":[175],"our":[178],"intervention":[179],"amplifies":[180],"sharpening":[184],"output":[186],"distribution":[187],"toward":[188],"successful":[189],"trajectories.":[191]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-10T00:00:00"}
