{"id":"https://openalex.org/W3005086430","doi":"https://doi.org/10.1145/3375627.3375830","title":"Fooling LIME and SHAP","display_name":"Fooling LIME and SHAP","publication_year":2020,"publication_date":"2020-02-05","ids":{"openalex":"https://openalex.org/W3005086430","doi":"https://doi.org/10.1145/3375627.3375830","mag":"3005086430"},"language":"en","primary_location":{"id":"doi:10.1145/3375627.3375830","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3375627.3375830","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3375627.3375830","source":{"id":"https://openalex.org/S5407048695","display_name":"Proceedings of the AAAI/ACM Conference on AI Ethics and Society","issn_l":"3065-8365","issn":["3065-8365"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3375627.3375830","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012515310","display_name":"Dylan Slack","orcid":"https://orcid.org/0000-0003-4186-2937"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dylan Slack","raw_affiliation_strings":["University of California, Irvine, Irvine, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Irvine, Irvine, CA, USA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069982277","display_name":"Sophie Hilgard","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sophie Hilgard","raw_affiliation_strings":["Harvard University, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Harvard University, Cambridge, MA, USA","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016456905","display_name":"Emily Jia","orcid":null},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Emily Jia","raw_affiliation_strings":["Harvard University, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Harvard University, Cambridge, MA, USA","institution_ids":["https://openalex.org/I2801851002"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005779128","display_name":"Sameer Singh","orcid":"https://orcid.org/0000-0003-0621-6323"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sameer Singh","raw_affiliation_strings":["University of California, Irvine, Irvine, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Irvine, Irvine, CA, USA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015520086","display_name":"Himabindu Lakkaraju","orcid":"https://orcid.org/0000-0001-7922-6544"},"institutions":[{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Himabindu Lakkaraju","raw_affiliation_strings":["Harvard University, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Harvard University, Cambridge, MA, USA","institution_ids":["https://openalex.org/I2801851002"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5012515310"],"corresponding_institution_ids":["https://openalex.org/I204250578"],"apc_list":null,"apc_paid":null,"fwci":46.8921,"has_fulltext":true,"cited_by_count":730,"citation_normalized_percentile":{"value":0.99886985,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"180","last_page":"186"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7384046316146851},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.7242454290390015},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5694364905357361},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.5672917366027832},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5425598621368408},{"id":"https://openalex.org/keywords/post-hoc","display_name":"Post hoc","score":0.4589371085166931},{"id":"https://openalex.org/keywords/toolbox","display_name":"Toolbox","score":0.4234752655029297},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.36148297786712646},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10221680998802185}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7384046316146851},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.7242454290390015},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5694364905357361},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.5672917366027832},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5425598621368408},{"id":"https://openalex.org/C2992886853","wikidata":"https://www.wikidata.org/wiki/Q18381816","display_name":"Post hoc","level":2,"score":0.4589371085166931},{"id":"https://openalex.org/C2777655017","wikidata":"https://www.wikidata.org/wiki/Q1501161","display_name":"Toolbox","level":2,"score":0.4234752655029297},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36148297786712646},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10221680998802185},{"id":"https://openalex.org/C199343813","wikidata":"https://www.wikidata.org/wiki/Q12128","display_name":"Dentistry","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3375627.3375830","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3375627.3375830","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3375627.3375830","source":{"id":"https://openalex.org/S5407048695","display_name":"Proceedings of the AAAI/ACM Conference on AI Ethics and Society","issn_l":"3065-8365","issn":["3065-8365"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3375627.3375830","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3375627.3375830","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3375627.3375830","source":{"id":"https://openalex.org/S5407048695","display_name":"Proceedings of the AAAI/ACM Conference on AI Ethics and Society","issn_l":"3065-8365","issn":["3065-8365"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.800000011920929}],"awards":[{"id":"https://openalex.org/G3506203934","display_name":"CRII: RI: Explaining Decisions of Black-box Models via Input Perturbations","funder_award_id":"1756023","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G578852481","display_name":null,"funder_award_id":"#IIS-1756023","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320317052","display_name":"Allen Institute for Artificial Intelligence","ror":"https://ror.org/05w520734"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3005086430.pdf","grobid_xml":"https://content.openalex.org/works/W3005086430.grobid-xml"},"referenced_works_count":17,"referenced_works":["https://openalex.org/W2029199047","https://openalex.org/W2516809705","https://openalex.org/W2602024037","https://openalex.org/W2618851150","https://openalex.org/W2788007910","https://openalex.org/W2898694742","https://openalex.org/W2912477312","https://openalex.org/W2913039310","https://openalex.org/W2945976633","https://openalex.org/W2962790223","https://openalex.org/W2962843949","https://openalex.org/W2963399068","https://openalex.org/W2963483561","https://openalex.org/W3104310207","https://openalex.org/W3120740533","https://openalex.org/W3125203539","https://openalex.org/W4289097366"],"related_works":["https://openalex.org/W4205140848","https://openalex.org/W2068663075","https://openalex.org/W2978678743","https://openalex.org/W2502115930","https://openalex.org/W2797837731","https://openalex.org/W4393677513","https://openalex.org/W4390832911","https://openalex.org/W829257147","https://openalex.org/W2482350142","https://openalex.org/W4385302116"],"abstract_inverted_index":{"As":[0],"machine":[1],"learning":[2],"black":[3,29,51],"boxes":[4,30],"are":[5,37,73],"increasingly":[6],"being":[7,38],"deployed":[8],"in":[9,31,113],"domains":[10],"such":[11,68,114,166],"as":[12,69,167],"healthcare":[13],"and":[14,24,47,71,169],"criminal":[15],"justice,":[16],"there":[17],"is":[18],"growing":[19],"emphasis":[20],"on":[21,65,120],"building":[22],"tools":[23],"techniques":[25,62,165],"for":[26],"explaining":[27],"these":[28],"an":[32,94,99],"interpretable":[33],"manner.":[34],"Such":[35],"explanations":[36,61,132,174],"leveraged":[39],"by":[40,92,157],"domain":[41],"experts":[42],"to":[43,97,108],"diagnose":[44],"systematic":[45],"errors":[46],"underlying":[48,180],"biases":[49,87],"of":[50,88,133],"boxes.":[52],"In":[53],"this":[54],"paper,":[55],"we":[56,77,149],"demonstrate":[57,150],"that":[58,63,83,117],"post":[59,130],"hoc":[60,131],"rely":[64],"input":[66,122],"perturbations,":[67],"LIME":[70,168],"SHAP,":[72],"not":[74,177],"reliable.":[75],"Specifically,":[76],"propose":[78],"a":[79,115],"novel":[80],"scaffolding":[81],"technique":[82],"effectively":[84],"hides":[85],"the":[86,121,129,134,179],"any":[89,110],"given":[90],"classifier":[91,112,136],"allowing":[93],"adversarial":[95],"entity":[96],"craft":[98],"arbitrary":[100],"desired":[101],"explanation.":[102],"Our":[103],"approach":[104],"can":[105,160],"be":[106],"used":[107],"scaffold":[109],"biased":[111,153],"way":[116],"its":[118],"predictions":[119],"data":[123],"distribution":[124],"still":[125],"remain":[126],"biased,":[127],"but":[128],"scaffolded":[135],"look":[137],"innocuous.":[138],"Using":[139],"extensive":[140],"evaluation":[141],"with":[142],"multiple":[143],"real":[144],"world":[145],"datasets":[146],"(including":[147],"COMPAS),":[148],"how":[151],"extremely":[152],"(racist)":[154],"classifiers":[155],"crafted":[156],"our":[158],"framework":[159],"easily":[161],"fool":[162],"popular":[163],"explanation":[164],"SHAP":[170],"into":[171],"generating":[172],"innocuous":[173],"which":[175],"do":[176],"reflect":[178],"biases.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":44},{"year":2025,"cited_by_count":172},{"year":2024,"cited_by_count":165},{"year":2023,"cited_by_count":126},{"year":2022,"cited_by_count":79},{"year":2021,"cited_by_count":108},{"year":2020,"cited_by_count":32},{"year":2019,"cited_by_count":4}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
