{"id":"https://openalex.org/W7140210059","doi":"https://doi.org/10.48550/arxiv.2603.21014","title":"CLT-Forge: A Scalable Library for Cross-Layer Transcoders and Attribution Graphs","display_name":"CLT-Forge: A Scalable Library for Cross-Layer Transcoders and Attribution Graphs","publication_year":2026,"publication_date":"2026-03-22","ids":{"openalex":"https://openalex.org/W7140210059","doi":"https://doi.org/10.48550/arxiv.2603.21014"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21014","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21014","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21014","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Draye, Florent","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Draye, Florent","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Harrasse, Abir","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Harrasse, Abir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Palit, Vedant","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Palit, Vedant","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wu, Tung-Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Tung-Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Jiarui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiarui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Pandey, Punya Syon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pandey, Punya Syon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wu, Roderick","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Roderick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Terry Jingchen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Terry Jingchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jin, Zhijing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Zhijing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Sch\u00f6lkopf, Bernhard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sch\u00f6lkopf, Bernhard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9269999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9269999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.01590000092983246,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.013500000350177288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9689000248908997},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6796000003814697},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.49619999527931213},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4530999958515167},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4374000132083893},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4138999879360199},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.3625999987125397},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.3495999872684479}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9689000248908997},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7738999724388123},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6796000003814697},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.5060999989509583},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.49619999527931213},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49230000376701355},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4530999958515167},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4374000132083893},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4138999879360199},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.367900013923645},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.3625999987125397},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3495999872684479},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3273000121116638},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.32359999418258667},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.2849999964237213},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.2827000021934509},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.259799987077713}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21014","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21014","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21014","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21014","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6355955600738525,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Mechanistic":[0],"interpretability":[1,51,91,110],"seeks":[2],"to":[3,37,76],"understand":[4],"how":[5],"Large":[6],"Language":[7],"Models":[8],"(LLMs)":[9],"represent":[10],"and":[11,20,32,47,78,90,103,115,122,131],"process":[12],"information.":[13],"Recent":[14],"approaches":[15],"based":[16],"on":[17],"dictionary":[18],"learning":[19],"transcoders":[21],"enable":[22],"representing":[23],"model":[24,101],"computation":[25,119],"in":[26,52],"terms":[27],"of":[28,92],"sparse,":[29],"interpretable":[30],"features":[31,62],"their":[33,50],"interactions,":[34],"giving":[35],"rise":[36],"feature":[38,113],"attribution":[39,117],"graphs.":[40],"However,":[41],"these":[42],"graphs":[43],"are":[44],"often":[45],"large":[46],"redundant,":[48],"limiting":[49],"practice.":[53],"Cross-Layer":[54],"Transcoders":[55],"(CLTs)":[56],"address":[57],"this":[58],"issue":[59],"by":[60],"sharing":[61],"across":[63],"layers":[64],"while":[65],"preserving":[66],"layer-specific":[67],"decoding,":[68],"yielding":[69],"more":[70],"compact":[71],"representations,":[72],"but":[73],"remain":[74],"difficult":[75],"train":[77],"analyze":[79],"at":[80],"scale.":[81],"We":[82],"introduce":[83],"an":[84],"open-source":[85],"library":[86],"for":[87,112,134],"end-to-end":[88],"training":[89,99],"CLTs.":[93],"Our":[94,139],"framework":[95],"integrates":[96],"scalable":[97],"distributed":[98],"with":[100],"sharding":[102],"compressed":[104],"activation":[105],"caching,":[106],"a":[107,123,129],"unified":[108,132],"automated":[109],"pipeline":[111],"analysis":[114],"explanation,":[116],"graph":[118],"using":[120],"Circuit-Tracer,":[121],"flexible":[124],"visualization":[125],"interface.":[126],"This":[127],"provides":[128],"practical":[130],"solution":[133],"scaling":[135],"CLT-based":[136],"mechanistic":[137],"interpretability.":[138],"code":[140],"is":[141],"available":[142],"at:":[143],"https://github.com/LLM-Interp/CLT-Forge.":[144]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-25T00:00:00"}
