{"id":"https://openalex.org/W7141109117","doi":"https://doi.org/10.48550/arxiv.2603.24653","title":"From Weights to Concepts: Data-Free Interpretability of CLIP via Singular Vector Decomposition","display_name":"From Weights to Concepts: Data-Free Interpretability of CLIP via Singular Vector Decomposition","publication_year":2026,"publication_date":"2026-03-25","ids":{"openalex":"https://openalex.org/W7141109117","doi":"https://doi.org/10.48550/arxiv.2603.24653"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.24653","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24653","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.24653","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130736522","display_name":"Francesco Gentile","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gentile, Francesco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128705746","display_name":"Nicola Dall'Asen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dall'Asen, Nicola","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101868306","display_name":"Francesco Tonini","orcid":"https://orcid.org/0000-0002-1938-3449"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tonini, Francesco","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130789382","display_name":"Massimiliano Mancini","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mancini, Massimiliano","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039878198","display_name":"Lorenzo Vaquero","orcid":"https://orcid.org/0000-0002-1874-3078"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vaquero, Lorenzo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130773169","display_name":"Elisa Ricci","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ricci, Elisa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.897599995136261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.897599995136261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.05959999933838844,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.010599999688565731,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.958299994468689},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.511900007724762},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.4964999854564667},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41780000925064087},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4077000021934509},{"id":"https://openalex.org/keywords/basis","display_name":"Basis (linear algebra)","score":0.4041000008583069}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.958299994468689},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5928000211715698},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5665000081062317},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.511900007724762},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.4964999854564667},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4187000095844269},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41780000925064087},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4077000021934509},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.4041000008583069},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.30250000953674316},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3003000020980835},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2867000102996826},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27469998598098755},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2694000005722046}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.24653","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24653","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.24653","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24653","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"vision-language":[1],"models":[2],"are":[3],"deployed":[4],"at":[5],"scale,":[6],"understanding":[7],"their":[8],"internal":[9],"mechanisms":[10],"becomes":[11],"increasingly":[12],"critical.":[13],"Existing":[14],"interpretability":[15,107],"methods":[16],"predominantly":[17],"rely":[18],"on":[19],"activations,":[20],"making":[21],"them":[22,84],"dataset-dependent,":[23],"vulnerable":[24],"to":[25,31,112,136],"data":[26],"bias,":[27],"and":[28,69,106],"often":[29],"restricted":[30],"coarse":[32],"head-level":[33],"explanations.":[34],"We":[35,93],"introduce":[36],"SITH":[37,96,114,135],"(Semantic":[38],"Inspection":[39],"of":[40,90],"Transformer":[41],"Heads),":[42],"a":[43,79,145],"fully":[44],"data-free,":[45],"training-free":[46],"framework":[47],"that":[48,82,95,121],"directly":[49],"analyzes":[50],"CLIP's":[51],"vision":[52],"transformer":[53],"in":[54],"weight":[55],"space.":[56],"For":[57],"each":[58,71],"attention":[59],"head,":[60],"we":[61,133],"decompose":[62],"its":[63],"value-output":[64],"matrix":[65],"into":[66],"singular":[67],"vectors":[68],"interpret":[70],"one":[72],"via":[73],"COMP":[74],"(Coherent":[75],"Orthogonal":[76],"Matching":[77],"Pursuit),":[78],"new":[80,153],"algorithm":[81],"explains":[83],"as":[85],"sparse,":[86],"semantically":[87],"coherent":[88],"combinations":[89],"human-interpretable":[91],"concepts.":[92],"show":[94],"yields":[97],"coherent,":[98],"faithful":[99],"intra-head":[100],"explanations,":[101],"validated":[102],"through":[103],"reconstruction":[104],"fidelity":[105],"experiments.":[108],"This":[109],"allows":[110],"us":[111],"use":[113,134],"for":[115],"precise,":[116],"interpretable":[117],"weight-space":[118],"model":[119,138],"edits":[120],"amplify":[122],"or":[123],"suppress":[124],"specific":[125],"concepts,":[126],"improving":[127],"downstream":[128],"performance":[129],"without":[130],"retraining.":[131],"Furthermore,":[132],"study":[137],"adaptation,":[139],"showing":[140],"how":[141],"fine-tuning":[142],"primarily":[143],"reweights":[144],"stable":[146],"semantic":[147],"basis":[148],"rather":[149],"than":[150],"learning":[151],"entirely":[152],"features.":[154]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-28T00:00:00"}
