{"id":"https://openalex.org/W7147544269","doi":"https://doi.org/10.48550/arxiv.2603.28744","title":"Stop Probing, Start Coding: Why Linear Probes and Sparse Autoencoders Fail at Compositional Generalisation","display_name":"Stop Probing, Start Coding: Why Linear Probes and Sparse Autoencoders Fail at Compositional Generalisation","publication_year":2026,"publication_date":"2026-03-30","ids":{"openalex":"https://openalex.org/W7147544269","doi":"https://doi.org/10.48550/arxiv.2603.28744"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.28744","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28744","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.28744","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132679608","display_name":"Vit\u00f3ria Barin Pacela","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Pacela, Vit\u00f3ria Barin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132562645","display_name":"Shruti Joshi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joshi, Shruti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132670135","display_name":"Isabela Camacho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Camacho, Isabela","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051076050","display_name":"Simon Lacoste-Julien","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lacoste-Julien, Simon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5059395392","display_name":"David Klindt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klindt, David","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5132679608"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2567000091075897,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2567000091075897,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.22059999406337738,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.16760000586509705,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.761900007724762},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5054000020027161},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.47859999537467957},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.4772999882698059},{"id":"https://openalex.org/keywords/neural-coding","display_name":"Neural coding","score":0.4674000144004822},{"id":"https://openalex.org/keywords/sparse-approximation","display_name":"Sparse approximation","score":0.4239000082015991},{"id":"https://openalex.org/keywords/k-svd","display_name":"K-SVD","score":0.41909998655319214},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36320000886917114},{"id":"https://openalex.org/keywords/determinantal-point-process","display_name":"Determinantal point process","score":0.3617999851703644},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.349700003862381}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.761900007724762},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6376000046730042},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5724999904632568},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.47859999537467957},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.4772999882698059},{"id":"https://openalex.org/C77637269","wikidata":"https://www.wikidata.org/wiki/Q7002051","display_name":"Neural coding","level":2,"score":0.4674000144004822},{"id":"https://openalex.org/C124066611","wikidata":"https://www.wikidata.org/wiki/Q28684319","display_name":"Sparse approximation","level":2,"score":0.4239000082015991},{"id":"https://openalex.org/C154771677","wikidata":"https://www.wikidata.org/wiki/Q17098361","display_name":"K-SVD","level":3,"score":0.41909998655319214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40849998593330383},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36320000886917114},{"id":"https://openalex.org/C72010251","wikidata":"https://www.wikidata.org/wiki/Q5265688","display_name":"Determinantal point process","level":4,"score":0.3617999851703644},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.349700003862381},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3488999903202057},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.31439998745918274},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3052000105381012},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.2989000082015991},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.2946000099182129},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C88626702","wikidata":"https://www.wikidata.org/wiki/Q1128903","display_name":"Continuation","level":2,"score":0.28610000014305115},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.27900001406669617},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C42023084","wikidata":"https://www.wikidata.org/wiki/Q5249231","display_name":"Decision boundary","level":3,"score":0.25949999690055847},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.28744","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28744","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.28744","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28744","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.51658695936203,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"linear":[1,13,35,45],"representation":[2],"hypothesis":[3],"states":[4],"that":[5,112],"neural":[6],"network":[7],"activations":[8],"encode":[9],"high-level":[10],"concepts":[11],"as":[12,126,175,190],"mixtures.":[14],"However,":[15],"under":[16,104,198],"superposition,":[17],"this":[18,49,87],"encoding":[19],"is":[20,159],"a":[21,24,29,34,78,82,162,176],"projection":[22],"from":[23],"higher-dimensional":[25],"concept":[26,40],"space":[27,41],"into":[28,77],"lower-dimensional":[30],"activation":[31],"space,":[32],"and":[33,97,137,184],"decision":[36],"boundary":[37],"in":[38,133],"the":[39,71,114,122,127,139,145,151,157,172,191],"need":[42],"not":[43,121,149,180],"remain":[44],"after":[46],"projection.":[47],"In":[48],"setting,":[50],"classical":[51],"sparse":[52,75,196],"coding":[53],"methods":[54],"with":[55,141,161],"per-sample":[56,142],"iterative":[57],"inference":[58,76,123,197],"leverage":[59],"compressed":[60],"sensing":[61],"guarantees":[62],"to":[63,102,186],"recover":[64],"latent":[65,95],"factors.":[66],"Sparse":[67],"autoencoders":[68],"(SAEs),":[69],"on":[70,144],"other":[72],"hand,":[73],"amortise":[74],"fixed":[79],"encoder,":[80],"introducing":[81],"systematic":[83],"gap.":[84,152],"We":[85],"show":[86],"amortisation":[88,182],"gap":[89],"persists":[90],"across":[91],"training":[92],"set":[93],"sizes,":[94],"dimensions,":[96],"sparsity":[98],"levels,":[99],"causing":[100],"SAEs":[101],"fail":[103],"out-of-distribution":[105],"(OOD)":[106],"compositional":[107],"shifts.":[108],"Through":[109],"controlled":[110],"experiments":[111],"decompose":[113],"failure,":[115],"we":[116],"identify":[117],"dictionary":[118,147,164,177,188],"learning":[119,178,189],"--":[120,125],"procedure":[124],"binding":[128],"constraint:":[129],"SAE-learned":[130],"dictionaries":[131],"point":[132,185],"substantially":[134],"wrong":[135],"directions,":[136],"replacing":[138],"encoder":[140],"FISTA":[143],"same":[146],"does":[148],"close":[150],"An":[153],"oracle":[154],"baseline":[155],"proves":[156],"problem":[158,194],"solvable":[160],"good":[163],"at":[165],"all":[166],"scales":[167],"tested.":[168],"Our":[169],"results":[170],"reframe":[171],"SAE":[173],"failure":[174],"challenge,":[179],"an":[181],"problem,":[183],"scalable":[187],"key":[192],"open":[193],"for":[195],"superposition.":[199]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
