{"id":"https://openalex.org/W4312453724","doi":"https://doi.org/10.1109/tai.2022.3223892","title":"Explain the Explainer: Interpreting Model-Agnostic Counterfactual Explanations of a Deep Reinforcement Learning Agent","display_name":"Explain the Explainer: Interpreting Model-Agnostic Counterfactual Explanations of a Deep Reinforcement Learning Agent","publication_year":2022,"publication_date":"2022-11-24","ids":{"openalex":"https://openalex.org/W4312453724","doi":"https://doi.org/10.1109/tai.2022.3223892"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2022.3223892","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2022.3223892","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://iris.uniroma1.it/bitstream/11573/1667241/1/Chen_postprint_Explain_2024.pdf.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101773785","display_name":"Ziheng Chen","orcid":"https://orcid.org/0000-0002-2585-637X"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ziheng Chen","raw_affiliation_strings":["Department of Applied Mathematics and Statistics, Stony Brook University, Stony Brook, NY, USA"],"affiliations":[{"raw_affiliation_string":"Department of Applied Mathematics and Statistics, Stony Brook University, Stony Brook, NY, USA","institution_ids":["https://openalex.org/I59553526"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044165871","display_name":"Fabrizio Silvestri","orcid":"https://orcid.org/0000-0001-7669-9055"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabrizio Silvestri","raw_affiliation_strings":["Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011299100","display_name":"Gabriele Tolomei","orcid":"https://orcid.org/0000-0001-7471-6659"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gabriele Tolomei","raw_affiliation_strings":["Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100404643","display_name":"Jia Wang","orcid":"https://orcid.org/0000-0002-3165-7051"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]},{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["CN","IT"],"is_corresponding":false,"raw_author_name":"Jia Wang","raw_affiliation_strings":["Department of Intelligent Science, Xi&#x0027;an Jiaotong-Liverpool University, Suzhou, China","Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Intelligent Science, Xi&#x0027;an Jiaotong-Liverpool University, Suzhou, China","institution_ids":["https://openalex.org/I69356397"]},{"raw_affiliation_string":"Department of Computer Engineering and the Department of Computer Science, Sapienza University of Rome, Rome, Italy","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004145814","display_name":"He Zhu","orcid":"https://orcid.org/0000-0001-9606-150X"},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"He Zhu","raw_affiliation_strings":["Department of Computer Science, Rutgers University&#x2013;New Brunswick, Piscataway, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Rutgers University&#x2013;New Brunswick, Piscataway, NJ, USA","institution_ids":["https://openalex.org/I102322142"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102758548","display_name":"Hongshik Ahn","orcid":"https://orcid.org/0000-0002-8924-6159"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hongshik Ahn","raw_affiliation_strings":["Department of Applied Mathematics and Statistics, Stony Brook University, Stony Brook, NY, USA"],"affiliations":[{"raw_affiliation_string":"Department of Applied Mathematics and Statistics, Stony Brook University, Stony Brook, NY, USA","institution_ids":["https://openalex.org/I59553526"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101773785"],"corresponding_institution_ids":["https://openalex.org/I59553526"],"apc_list":null,"apc_paid":null,"fwci":3.0536,"has_fulltext":true,"cited_by_count":22,"citation_normalized_percentile":{"value":0.92548701,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"5","issue":"4","first_page":"1443","last_page":"1457"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9639000296592712,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.8952949047088623},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7688457369804382},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7413648962974548},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7261198163032532},{"id":"https://openalex.org/keywords/counterfactual-conditional","display_name":"Counterfactual conditional","score":0.7015236020088196},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.7007858157157898},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5316940546035767},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5105041265487671},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4619847238063812},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.431222528219223},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.07853084802627563}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.8952949047088623},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7688457369804382},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7413648962974548},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7261198163032532},{"id":"https://openalex.org/C71889745","wikidata":"https://www.wikidata.org/wiki/Q1783264","display_name":"Counterfactual conditional","level":3,"score":0.7015236020088196},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7007858157157898},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5316940546035767},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5105041265487671},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4619847238063812},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.431222528219223},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.07853084802627563},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tai.2022.3223892","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2022.3223892","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:iris.uniroma1.it:11573/1667241","is_oa":true,"landing_page_url":"https://hdl.handle.net/11573/1667241","pdf_url":"https://iris.uniroma1.it/bitstream/11573/1667241/1/Chen_postprint_Explain_2024.pdf.pdf","source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:iris.uniroma1.it:11573/1667241","is_oa":true,"landing_page_url":"https://hdl.handle.net/11573/1667241","pdf_url":"https://iris.uniroma1.it/bitstream/11573/1667241/1/Chen_postprint_Explain_2024.pdf.pdf","source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.8100000023841858}],"awards":[{"id":"https://openalex.org/G8091430692","display_name":null,"funder_award_id":"(MIUR)","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"}],"funders":[{"id":"https://openalex.org/F4320317295","display_name":"Dipartimenti di Eccellenza","ror":null},{"id":"https://openalex.org/F4320321873","display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","ror":"https://ror.org/0166hxq48"},{"id":"https://openalex.org/F4320324032","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312453724.pdf","grobid_xml":"https://content.openalex.org/works/W4312453724.grobid-xml"},"referenced_works_count":61,"referenced_works":["https://openalex.org/W2022852506","https://openalex.org/W2091447598","https://openalex.org/W2107297861","https://openalex.org/W2144366468","https://openalex.org/W2243397390","https://openalex.org/W2256420211","https://openalex.org/W2612581922","https://openalex.org/W2715209044","https://openalex.org/W2739657930","https://openalex.org/W2803974723","https://openalex.org/W2888487581","https://openalex.org/W2891340972","https://openalex.org/W2897417898","https://openalex.org/W2909392392","https://openalex.org/W2945295328","https://openalex.org/W2953466973","https://openalex.org/W2963125461","https://openalex.org/W2964067469","https://openalex.org/W2967730222","https://openalex.org/W2979156612","https://openalex.org/W2979997102","https://openalex.org/W3000716014","https://openalex.org/W3019132020","https://openalex.org/W3023497337","https://openalex.org/W3034697737","https://openalex.org/W3041133507","https://openalex.org/W3043146651","https://openalex.org/W3081364375","https://openalex.org/W3092961465","https://openalex.org/W3094613840","https://openalex.org/W3096345829","https://openalex.org/W3099331386","https://openalex.org/W3099844187","https://openalex.org/W3101038122","https://openalex.org/W3102161834","https://openalex.org/W3104149808","https://openalex.org/W3104371626","https://openalex.org/W3125997628","https://openalex.org/W3202810143","https://openalex.org/W4214717370","https://openalex.org/W4220696590","https://openalex.org/W4293583991","https://openalex.org/W6637967152","https://openalex.org/W6640174482","https://openalex.org/W6684921986","https://openalex.org/W6687681856","https://openalex.org/W6745861399","https://openalex.org/W6749992176","https://openalex.org/W6751437432","https://openalex.org/W6751959524","https://openalex.org/W6754843927","https://openalex.org/W6755326576","https://openalex.org/W6756303580","https://openalex.org/W6756413876","https://openalex.org/W6762622100","https://openalex.org/W6769214901","https://openalex.org/W6779372675","https://openalex.org/W6784161558","https://openalex.org/W6785204124","https://openalex.org/W6797537360","https://openalex.org/W6840573628"],"related_works":["https://openalex.org/W2056582926","https://openalex.org/W3137864021","https://openalex.org/W2162910442","https://openalex.org/W2079879923","https://openalex.org/W4200271736","https://openalex.org/W2104420793","https://openalex.org/W3017854570","https://openalex.org/W2028689793","https://openalex.org/W4242448314","https://openalex.org/W3028884462"],"abstract_inverted_index":{"Counterfactual":[0],"examples":[1],"(CFs)":[2],"are":[3,39],"one":[4],"of":[5,28,74,117,125,173],"the":[6,26,72,85,110,115,123,171],"most":[7],"popular":[8],"methods":[9,23],"for":[10,43,48],"attaching":[11],"post-hoc":[12],"explanations":[13,184],"to":[14,41,54,64,105,121,154,158,162,176],"machine":[15],"learning":[16,91],"(ML)":[17],"models.":[18],"However,":[19],"existing":[20,142],"CF":[21,143],"generation":[22,144],"either":[24],"exploit":[25],"internals":[27],"specific":[29],"models":[30,45,157],"or":[31],"depend":[32],"on":[33,133],"each":[34],"sample's":[35],"neighborhood;":[36],"thus,":[37],"they":[38],"hard":[40],"generalize":[42],"complex":[44,155],"and":[46,58,160,165,180],"inefficient":[47],"large":[49],"datasets.":[50],"This":[51],"work":[52],"aims":[53],"overcome":[55],"these":[56],"limitations":[57],"introduces":[59],"RELAX,":[60],"a":[61,78,102,118],"model-agnostic":[62],"algorithm":[63,104],"generate":[65],"optimal":[66,86],"counterfactual":[67],"explanations.":[68],"Specifically,":[69],"we":[70,100,169],"formulate":[71],"problem":[73],"crafting":[75],"CFs":[76,87,127],"as":[77,146],"sequential":[79],"decision-making":[80],"task.":[81],"We":[82],"then":[83],"find":[84],"via":[88],"deep":[89],"reinforcement":[90],"(DRL)":[92],"with":[93],"discretecontinuous":[94],"hybrid":[95],"action":[96],"space.":[97],"In":[98],"addition,":[99],"develop":[101],"distillation":[103],"extract":[106],"decision":[107,119],"rules":[108],"from":[109],"DRL":[111],"agent's":[112],"policy":[113,183],"in":[114,185],"form":[116],"tree":[120],"make":[122],"process":[124],"generating":[126],"itself":[128],"interpretable.":[129],"Extensive":[130],"experiments":[131],"conducted":[132],"six":[134],"tabular":[135],"datasets":[136],"have":[137],"shown":[138],"that":[139],"RELAX":[140],"outperforms":[141],"baselines,":[145],"it":[147],"produces":[148],"sparser":[149],"counterfactuals,":[150],"is":[151],"more":[152],"scalable":[153],"target":[156],"explain,":[159],"generalizes":[161],"both":[163],"classification":[164],"regression":[166],"tasks.":[167],"Finally,":[168],"show":[170],"ability":[172],"our":[174],"method":[175],"provide":[177],"actionable":[178],"recommendations":[179],"distill":[181],"interpretable":[182],"two":[186],"practical,":[187],"real-world":[188],"use":[189],"cases.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":6}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
