{"id":"https://openalex.org/W4390833810","doi":"https://doi.org/10.48550/arxiv.2401.06122","title":"Manipulating Feature Visualizations with Gradient Slingshots","display_name":"Manipulating Feature Visualizations with Gradient Slingshots","publication_year":2024,"publication_date":"2024-01-11","ids":{"openalex":"https://openalex.org/W4390833810","doi":"https://doi.org/10.48550/arxiv.2401.06122"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2401.06122","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.06122","pdf_url":"https://arxiv.org/pdf/2401.06122","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2401.06122","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082253730","display_name":"Dilyara Bareeva","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bareeva, Dilyara","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026720807","display_name":"Marina M. -C. H\u00f6hne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"H\u00f6hne, Marina M. -C.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070293380","display_name":"Alexander Warnecke","orcid":"https://orcid.org/0009-0006-3617-3968"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Warnecke, Alexander","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049436073","display_name":"Lukas Pirch","orcid":"https://orcid.org/0009-0003-9185-780X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pirch, Lukas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107838719","display_name":"Klaus\u2010Robert M\u00fcller","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"M\u00fcller, Klaus-Robert","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066077721","display_name":"Konrad Rieck","orcid":"https://orcid.org/0000-0002-5054-8758"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rieck, Konrad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Lapuschkin, Sebastian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lapuschkin, Sebastian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Bykov, Kirill","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bykov, Kirill","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5082253730"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8254140019416809},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.626166582107544},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.61180579662323},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5978984236717224},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5187333226203918},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.5003218650817871},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4988133907318115},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46160903573036194},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4599977433681488},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.4200797975063324}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8254140019416809},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.626166582107544},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.61180579662323},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5978984236717224},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5187333226203918},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.5003218650817871},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4988133907318115},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46160903573036194},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4599977433681488},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.4200797975063324},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2401.06122","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.06122","pdf_url":"https://arxiv.org/pdf/2401.06122","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2401.06122","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2401.06122","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2401.06122","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2401.06122","pdf_url":"https://arxiv.org/pdf/2401.06122","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.8299999833106995,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G1585467943","display_name":null,"funder_award_id":"101093003","funder_id":"https://openalex.org/F4320334322","funder_display_name":"HORIZON EUROPE Framework Programme"},{"id":"https://openalex.org/G18682879","display_name":null,"funder_award_id":"390781972","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G3515353610","display_name":null,"funder_award_id":"01IS20055","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G352791218","display_name":null,"funder_award_id":"(BMBF)","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G5219130566","display_name":null,"funder_award_id":"EU Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G5717916917","display_name":null,"funder_award_id":"39078197","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G6052429835","display_name":null,"funder_award_id":"(DFG)","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G6955755495","display_name":null,"funder_award_id":"Germany","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"},{"id":"https://openalex.org/G7257732812","display_name":null,"funder_award_id":"101093003","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7686223061","display_name":null,"funder_award_id":"101189689","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"},{"id":"https://openalex.org/F4320334322","display_name":"HORIZON EUROPE Framework Programme","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4390833810.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2068608913","https://openalex.org/W3124914020","https://openalex.org/W2141033859","https://openalex.org/W3081694532","https://openalex.org/W2077542787","https://openalex.org/W2156434174","https://openalex.org/W2071701083","https://openalex.org/W2383687187","https://openalex.org/W2070401501","https://openalex.org/W2121496884"],"abstract_inverted_index":{"Feature":[0],"Visualization":[1],"(FV)":[2],"is":[3],"a":[4,24,43,66,78,102,121],"widely":[5],"used":[6],"technique":[7],"for":[8],"interpreting":[9],"concepts":[10],"learned":[11],"by":[12],"Deep":[13],"Neural":[14],"Networks":[15],"(DNNs),":[16],"which":[17],"synthesizes":[18],"input":[19],"patterns":[20],"that":[21,46],"maximally":[22],"activate":[23],"given":[25],"feature.":[26],"Despite":[27],"its":[28,90,127],"popularity,":[29],"the":[30,72],"trustworthiness":[31],"of":[32,65],"FV":[33,48,109],"explanations":[34],"has":[35],"received":[36],"limited":[37],"attention.":[38],"We":[39,81],"introduce":[40],"Gradient":[41],"Slingshots,":[42],"novel":[44],"method":[45],"enables":[47],"manipulation":[49],"without":[50],"modifying":[51],"model":[52],"architecture":[53],"or":[54],"significantly":[55],"degrading":[56],"performance.":[57],"By":[58],"shaping":[59],"new":[60],"trajectories":[61],"in":[62],"off-distribution":[63],"regions":[64],"feature's":[67],"activation":[68],"landscape,":[69],"we":[70,119],"coerce":[71],"optimization":[73],"process":[74],"to":[75,77,92],"converge":[76],"predefined":[79],"visualization.":[80],"evaluate":[82],"our":[83],"approach":[84],"on":[85,108],"several":[86],"DNN":[87],"architectures,":[88],"demonstrating":[89],"ability":[91],"replace":[93],"faithful":[94],"FVs":[95],"with":[96],"arbitrary":[97],"targets.":[98],"These":[99],"results":[100],"expose":[101],"critical":[103],"vulnerability:":[104],"auditors":[105],"relying":[106],"solely":[107],"may":[110],"accept":[111],"entirely":[112],"fabricated":[113],"explanations.":[114],"To":[115],"mitigate":[116],"this":[117],"risk,":[118],"propose":[120],"straightforward":[122],"defense":[123],"and":[124],"quantitatively":[125],"demonstrate":[126],"effectiveness.":[128]},"counts_by_year":[],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
