{"id":"https://openalex.org/W7154317394","doi":"https://doi.org/10.48550/arxiv.2604.09885","title":"What do your logits know? (The answer may surprise you!)","display_name":"What do your logits know? (The answer may surprise you!)","publication_year":2026,"publication_date":"2026-04-10","ids":{"openalex":"https://openalex.org/W7154317394","doi":"https://doi.org/10.48550/arxiv.2604.09885"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.09885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.09885","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000858764","display_name":"Masha Fedzechkina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fedzechkina, Masha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133607724","display_name":"Eleonora Gualdoni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gualdoni, Eleonora","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133607196","display_name":"Rita Ramos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramos, Rita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130325089","display_name":"Sinead Williamson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Williamson, Sinead","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.36230000853538513,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.36230000853538513,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.0771000012755394,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.07249999791383743,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.6938999891281128},{"id":"https://openalex.org/keywords/surprise","display_name":"Surprise","score":0.44209998846054077},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.34700000286102295},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.34200000762939453},{"id":"https://openalex.org/keywords/information-model","display_name":"Information model","score":0.3393999934196472},{"id":"https://openalex.org/keywords/information-processing","display_name":"Information processing","score":0.3160000145435333},{"id":"https://openalex.org/keywords/complete-information","display_name":"Complete information","score":0.2935999929904938}],"concepts":[{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.6938999891281128},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5777000188827515},{"id":"https://openalex.org/C2780343955","wikidata":"https://www.wikidata.org/wiki/Q333173","display_name":"Surprise","level":2,"score":0.44209998846054077},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3677999973297119},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.34200000762939453},{"id":"https://openalex.org/C21338462","wikidata":"https://www.wikidata.org/wiki/Q1662581","display_name":"Information model","level":2,"score":0.3393999934196472},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3382999897003174},{"id":"https://openalex.org/C87868495","wikidata":"https://www.wikidata.org/wiki/Q750843","display_name":"Information processing","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C113336015","wikidata":"https://www.wikidata.org/wiki/Q574010","display_name":"Complete information","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C140331021","wikidata":"https://www.wikidata.org/wiki/Q1868104","display_name":"Logit","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C2780378346","wikidata":"https://www.wikidata.org/wiki/Q1349983","display_name":"Leak","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C180198813","wikidata":"https://www.wikidata.org/wiki/Q121182","display_name":"Information system","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.09885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.09885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.09885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"work":[1],"has":[2],"shown":[3],"that":[4,38,104],"probing":[5],"model":[6,18,31,40],"internals":[7],"can":[8,116],"reveal":[9],"a":[10,49],"wealth":[11],"of":[12,24,57,83,135],"information":[13,28,37,58,71,119,131],"not":[14],"apparent":[15],"from":[16,68],"the":[17,22,39,53,69,74,84,92,111,136],"generations.":[19],"This":[20],"poses":[21],"risk":[23],"unintentional":[25],"or":[26],"malicious":[27],"leakage,":[29],"where":[30],"users":[32],"are":[33],"able":[34],"to":[35,98],"learn":[36],"owner":[41],"assumed":[42],"was":[43],"inaccessible.":[44],"Using":[45],"vision-language":[46],"models":[47],"as":[48,64,129,132],"testbed,":[50],"we":[51],"present":[52,120],"first":[54],"systematic":[55],"comparison":[56],"retained":[59],"at":[60],"different":[61],"\"representational":[62],"levels''":[63],"it":[65],"is":[66],"compressed":[67],"rich":[70],"encoded":[72],"in":[73,121,125],"residual":[75,85,138],"stream":[76,86],"through":[77],"two":[78],"natural":[79],"bottlenecks:":[80],"low-dimensional":[81],"projections":[82,134],"obtained":[87],"using":[88],"tuned":[89],"lens,":[90],"and":[91],"final":[93],"top-k":[94],"logits":[95],"most":[96],"likely":[97],"impact":[99],"model's":[100,112],"answer.":[101],"We":[102],"show":[103],"even":[105],"easily":[106],"accessible":[107],"bottlenecks":[108],"defined":[109],"by":[110],"top":[113],"logit":[114],"values":[115],"leak":[117],"task-irrelevant":[118],"an":[122],"image-based":[123],"query,":[124],"some":[126],"cases":[127],"revealing":[128],"much":[130],"direct":[133],"full":[137],"stream.":[139]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-15T00:00:00"}
