{"id":"https://openalex.org/W4399802212","doi":"https://doi.org/10.1007/s10994-024-06549-4","title":"Improving interpretability via regularization of neural activation sensitivity","display_name":"Improving interpretability via regularization of neural activation sensitivity","publication_year":2024,"publication_date":"2024-06-19","ids":{"openalex":"https://openalex.org/W4399802212","doi":"https://doi.org/10.1007/s10994-024-06549-4"},"language":"en","primary_location":{"id":"doi:10.1007/s10994-024-06549-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06549-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06549-4.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06549-4.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041715137","display_name":"Ofir Moshe","orcid":null},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Ofir Moshe","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091561099","display_name":"Gil Fidel","orcid":null},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Gil Fidel","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033439559","display_name":"Ron Bitton","orcid":"https://orcid.org/0000-0001-8942-9783"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Ron Bitton","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002391103","display_name":"Asaf Shabtai","orcid":"https://orcid.org/0000-0003-0630-4059"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Asaf Shabtai","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel"],"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, Beer-Sheva, Israel","institution_ids":["https://openalex.org/I124227911"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5041715137"],"corresponding_institution_ids":["https://openalex.org/I124227911"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":2.8095,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.91494088,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"113","issue":"9","first_page":"6165","last_page":"6196"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9440000057220459,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9937618970870972},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6815372109413147},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6481303572654724},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.6403864026069641},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6357672214508057},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6103538870811462},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.5195784568786621},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5061823725700378},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.4843969941139221}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9937618970870972},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6815372109413147},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6481303572654724},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.6403864026069641},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6357672214508057},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6103538870811462},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.5195784568786621},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5061823725700378},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.4843969941139221},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10994-024-06549-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06549-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06549-4.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10994-024-06549-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10994-024-06549-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10994-024-06549-4.pdf","source":{"id":"https://openalex.org/S62148650","display_name":"Machine Learning","issn_l":"0885-6125","issn":["0885-6125","1573-0565"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320323051","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399802212.pdf"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W1787224781","https://openalex.org/W1881549354","https://openalex.org/W2108598243","https://openalex.org/W2112796928","https://openalex.org/W2282821441","https://openalex.org/W2302255633","https://openalex.org/W2618851150","https://openalex.org/W2657631929","https://openalex.org/W2794825826","https://openalex.org/W2809671526","https://openalex.org/W2945359720","https://openalex.org/W2962821226","https://openalex.org/W2962858109","https://openalex.org/W2963446712","https://openalex.org/W2963564844","https://openalex.org/W2963847595","https://openalex.org/W2964303497","https://openalex.org/W2978302387","https://openalex.org/W2979494945","https://openalex.org/W2991526369","https://openalex.org/W2995245581","https://openalex.org/W2996344901","https://openalex.org/W2996564870","https://openalex.org/W3009542902","https://openalex.org/W3015625436","https://openalex.org/W3028525609","https://openalex.org/W3035264434","https://openalex.org/W3043786973","https://openalex.org/W3090855408","https://openalex.org/W3094502228","https://openalex.org/W3102785203","https://openalex.org/W3113162324","https://openalex.org/W3118608800","https://openalex.org/W3119904598","https://openalex.org/W3129006292","https://openalex.org/W4229494842","https://openalex.org/W4235855427","https://openalex.org/W4241727697","https://openalex.org/W4384296820","https://openalex.org/W6729756640","https://openalex.org/W6734194636","https://openalex.org/W6755310938","https://openalex.org/W6762929394","https://openalex.org/W6766530665"],"related_works":["https://openalex.org/W2809283485","https://openalex.org/W4293768783","https://openalex.org/W4288347394","https://openalex.org/W2950183588","https://openalex.org/W3080754722","https://openalex.org/W4383221314","https://openalex.org/W3093978547","https://openalex.org/W2953536436","https://openalex.org/W3203790781","https://openalex.org/W4313346231"],"abstract_inverted_index":{"Abstract":[0],"State-of-the-art":[1],"deep":[2],"neural":[3,113],"networks":[4],"(DNNs)":[5],"are":[6,146,159],"highly":[7],"effective":[8],"at":[9],"tackling":[10],"many":[11],"real-world":[12,47],"tasks.":[13],"However,":[14],"their":[15,29,35],"widespread":[16],"adoption":[17],"in":[18,46,70,166,171],"mission-critical":[19],"contexts":[20],"is":[21,65,77,107],"limited":[22],"due":[23],"to":[24,31,67,126,148],"two":[25],"major":[26],"weaknesses":[27],"-":[28],"susceptibility":[30],"adversarial":[32,92,136],"attacks":[33],"and":[34,44,96,131,151],"opaqueness.":[36],"The":[37,56],"former":[38],"raises":[39],"concerns":[40],"about":[41],"DNNs\u2019":[42,104],"security":[43],"generalization":[45],"conditions,":[48],"while":[49],"the":[50,89,110,118],"latter,":[51],"opaqueness,":[52],"directly":[53],"impacts":[54],"interpretability.":[55],"lack":[57],"of":[58,91,112,120,128,168],"interpretability":[59,105,119],"diminishes":[60],"user":[61],"trust":[62],"as":[63],"it":[64],"challenging":[66],"have":[68],"confidence":[69],"a":[71,99],"model\u2019s":[72],"decision":[73],"when":[74],"its":[75],"reasoning":[76],"not":[78],"aligned":[79],"with":[80],"human":[81],"perspectives.":[82],"In":[83],"this":[84],"research,":[85],"we":[86],"(1)":[87],"examine":[88],"effect":[90],"robustness":[93,137],"on":[94,109],"interpretability,":[95],"(2)":[97],"present":[98],"novel":[100],"approach":[101],"for":[102],"improving":[103],"that":[106,127,142,152],"based":[108],"regularization":[111],"activation":[114],"sensitivity.":[115],"We":[116],"evaluate":[117],"models":[121,130,132,145,153,165],"trained":[122,133,154],"using":[123,134,155],"our":[124,156],"method":[125,158],"standard":[129,149],"state-of-the-art":[135],"techniques.":[138],"Our":[139],"results":[140],"show":[141],"adversarially":[143,163],"robust":[144,164],"superior":[147],"models,":[150],"proposed":[157],"even":[160],"better":[161],"than":[162],"terms":[167],"interpretability.(Code":[169],"provided":[170],"supplementary":[172],"material.)":[173]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
