{"id":"https://openalex.org/W4391897126","doi":"https://doi.org/10.1145/3648472","title":"Redefining Counterfactual Explanations for Reinforcement Learning: Overview, Challenges and Opportunities","display_name":"Redefining Counterfactual Explanations for Reinforcement Learning: Overview, Challenges and Opportunities","publication_year":2024,"publication_date":"2024-02-17","ids":{"openalex":"https://openalex.org/W4391897126","doi":"https://doi.org/10.1145/3648472"},"language":"en","primary_location":{"id":"doi:10.1145/3648472","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3648472","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3648472","source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"},"type":"review","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3648472","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029228044","display_name":"Jasmina Gajcin","orcid":"https://orcid.org/0000-0002-8731-1236"},"institutions":[{"id":"https://openalex.org/I205274468","display_name":"Trinity College Dublin","ror":"https://ror.org/02tyrky19","country_code":"IE","type":"education","lineage":["https://openalex.org/I205274468"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Jasmina Gajcin","raw_affiliation_strings":["Trinity College Dublin, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"Trinity College Dublin, Dublin, Ireland","institution_ids":["https://openalex.org/I205274468"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059738292","display_name":"Ivana Duspari\u0107","orcid":"https://orcid.org/0000-0003-0621-5400"},"institutions":[{"id":"https://openalex.org/I205274468","display_name":"Trinity College Dublin","ror":"https://ror.org/02tyrky19","country_code":"IE","type":"education","lineage":["https://openalex.org/I205274468"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Ivana Dusparic","raw_affiliation_strings":["Trinity College Dublin, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"Trinity College Dublin, Dublin, Ireland","institution_ids":["https://openalex.org/I205274468"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5029228044"],"corresponding_institution_ids":["https://openalex.org/I205274468"],"apc_list":null,"apc_paid":null,"fwci":5.7518,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.96388029,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"56","issue":"9","first_page":"1","last_page":"33"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.989799976348877,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.9686700105667114},{"id":"https://openalex.org/keywords/counterfactual-conditional","display_name":"Counterfactual conditional","score":0.9627344608306885},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.814433217048645},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7792657613754272},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5825845003128052},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.5564975142478943},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.46795713901519775},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4647025465965271},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3654763698577881},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.13293617963790894},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.08271336555480957},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.07611185312271118},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.07537660002708435}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.9686700105667114},{"id":"https://openalex.org/C71889745","wikidata":"https://www.wikidata.org/wiki/Q1783264","display_name":"Counterfactual conditional","level":3,"score":0.9627344608306885},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.814433217048645},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7792657613754272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5825845003128052},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.5564975142478943},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.46795713901519775},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4647025465965271},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3654763698577881},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.13293617963790894},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.08271336555480957},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.07611185312271118},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.07537660002708435}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3648472","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3648472","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3648472","source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3648472","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3648472","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3648472","source":{"id":"https://openalex.org/S157921468","display_name":"ACM Computing Surveys","issn_l":"0360-0300","issn":["0360-0300","1557-7341"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Computing Surveys","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17","score":0.41999998688697815}],"awards":[{"id":"https://openalex.org/G2322257346","display_name":null,"funder_award_id":"18/CRT/622","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"},{"id":"https://openalex.org/G2394637485","display_name":null,"funder_award_id":"18/CRT/6223","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"},{"id":"https://openalex.org/G4915346836","display_name":null,"funder_award_id":"18/CRT/6","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"}],"funders":[{"id":"https://openalex.org/F4320320847","display_name":"Science Foundation Ireland","ror":"https://ror.org/0271asj38"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391897126.pdf","grobid_xml":"https://content.openalex.org/works/W4391897126.grobid-xml"},"referenced_works_count":112,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1977655452","https://openalex.org/W1987725948","https://openalex.org/W2005267223","https://openalex.org/W2100556411","https://openalex.org/W2115668428","https://openalex.org/W2126105956","https://openalex.org/W2129888542","https://openalex.org/W2136815777","https://openalex.org/W2156682402","https://openalex.org/W2169393322","https://openalex.org/W2173248099","https://openalex.org/W2282821441","https://openalex.org/W2460163328","https://openalex.org/W2462906003","https://openalex.org/W2493343568","https://openalex.org/W2584650420","https://openalex.org/W2622408375","https://openalex.org/W2765204106","https://openalex.org/W2769421449","https://openalex.org/W2777473055","https://openalex.org/W2789367970","https://openalex.org/W2796290181","https://openalex.org/W2800002784","https://openalex.org/W2883386984","https://openalex.org/W2884552039","https://openalex.org/W2891340972","https://openalex.org/W2892341857","https://openalex.org/W2901312569","https://openalex.org/W2920396325","https://openalex.org/W2942608247","https://openalex.org/W2945151003","https://openalex.org/W2945295328","https://openalex.org/W2952561542","https://openalex.org/W2958608582","https://openalex.org/W2962681511","https://openalex.org/W2962851944","https://openalex.org/W2962966435","https://openalex.org/W2963095307","https://openalex.org/W2963735256","https://openalex.org/W2963767194","https://openalex.org/W2963864421","https://openalex.org/W2966032590","https://openalex.org/W2966362896","https://openalex.org/W2967394917","https://openalex.org/W2969499763","https://openalex.org/W2973319951","https://openalex.org/W2977229822","https://openalex.org/W2994120362","https://openalex.org/W2994363832","https://openalex.org/W2996001543","https://openalex.org/W2998004401","https://openalex.org/W3003533476","https://openalex.org/W3003931103","https://openalex.org/W3003997138","https://openalex.org/W3013495647","https://openalex.org/W3019132020","https://openalex.org/W3029567494","https://openalex.org/W3034616174","https://openalex.org/W3038092671","https://openalex.org/W3039116038","https://openalex.org/W3082925502","https://openalex.org/W3090027660","https://openalex.org/W3090832565","https://openalex.org/W3092625790","https://openalex.org/W3094413969","https://openalex.org/W3094613840","https://openalex.org/W3099331386","https://openalex.org/W3100789280","https://openalex.org/W3101038122","https://openalex.org/W3101981467","https://openalex.org/W3103795814","https://openalex.org/W3104149808","https://openalex.org/W3104515094","https://openalex.org/W3116073702","https://openalex.org/W3124373176","https://openalex.org/W3125831310","https://openalex.org/W3125997628","https://openalex.org/W3129402291","https://openalex.org/W3135487809","https://openalex.org/W3161731903","https://openalex.org/W3164011142","https://openalex.org/W3172765376","https://openalex.org/W3185122822","https://openalex.org/W3194396392","https://openalex.org/W3202810143","https://openalex.org/W3209179910","https://openalex.org/W4220970489","https://openalex.org/W4221160215","https://openalex.org/W4225150645","https://openalex.org/W4226251505","https://openalex.org/W4226332514","https://openalex.org/W4231827019","https://openalex.org/W4287125114","https://openalex.org/W4287278746","https://openalex.org/W4287871975","https://openalex.org/W4288058262","https://openalex.org/W4288363736","https://openalex.org/W4297812478","https://openalex.org/W4297814571","https://openalex.org/W4297821991","https://openalex.org/W4298235707","https://openalex.org/W4298857966","https://openalex.org/W4322619403","https://openalex.org/W6637162671","https://openalex.org/W6637967152","https://openalex.org/W6718836005","https://openalex.org/W6766649691","https://openalex.org/W6780298458","https://openalex.org/W6790717558","https://openalex.org/W6966940381","https://openalex.org/W7027579263"],"related_works":["https://openalex.org/W2056582926","https://openalex.org/W3137864021","https://openalex.org/W2162910442","https://openalex.org/W2079879923","https://openalex.org/W4200271736","https://openalex.org/W2104420793","https://openalex.org/W3017854570","https://openalex.org/W2028689793","https://openalex.org/W4313936361","https://openalex.org/W4242448314"],"abstract_inverted_index":{"While":[0,89],"AI":[1,39,87],"algorithms":[2],"have":[3],"shown":[4],"remarkable":[5],"success":[6],"in":[7,61,92,120,129,132,143,161,177],"various":[8],"fields,":[9],"their":[10,15],"lack":[11],"of":[12,35,67,115,157],"transparency":[13],"hinders":[14],"application":[16],"to":[17,71,101],"real-life":[18],"tasks.":[19],"Although":[20],"explanations":[21,48,51,131,142],"targeted":[22],"at":[23],"non-experts":[24],"are":[25,40,49,74,96],"necessary":[26],"for":[27,38,64,80,112,168,174],"user":[28],"trust":[29],"and":[30,44,76,146,148,170],"human-AI":[31],"collaboration,":[32],"the":[33,62,65,68,82,86,110,113,126,138,150,155],"majority":[34],"explanation":[36,118],"methods":[37,98,158],"focused":[41],"on":[42,56],"developers":[43],"expert":[45],"users.":[46],"Counterfactual":[47],"local":[50],"that":[52,153],"offer":[53],"users":[54],"advice":[55,79],"what":[57],"can":[58],"be":[59],"changed":[60],"input":[63],"output":[66,84],"black-box":[69],"model":[70],"change.":[72],"Counterfactuals":[73],"user-friendly":[75],"provide":[77],"actionable":[78],"achieving":[81],"desired":[83],"from":[85,159],"system.":[88],"extensively":[90],"researched":[91],"supervised":[93,133,144,160],"learning,":[94],"there":[95],"few":[97],"applying":[99],"them":[100],"reinforcement":[102,162],"learning":[103,145],"(RL).":[104],"In":[105],"this":[106],"work,":[107],"we":[108,136,165],"explore":[109,137],"reasons":[111],"underrepresentation":[114],"a":[116],"powerful":[117],"method":[119],"RL.":[121,178],"We":[122],"start":[123],"by":[124],"reviewing":[125],"current":[127],"work":[128],"counterfactual":[130,141],"learning.":[134,163],"Additionally,":[135],"differences":[139],"between":[140],"RL":[147,169],"identify":[149],"main":[151],"challenges":[152],"prevent":[154],"adoption":[156],"Finally,":[164],"redefine":[166],"counterfactuals":[167,176],"propose":[171],"research":[172],"directions":[173],"implementing":[175]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":4}],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2025-10-10T00:00:00"}
