{"id":"https://openalex.org/W4401857392","doi":"https://doi.org/10.1145/3637528.3671595","title":"XRL-Bench: A Benchmark for Evaluating and Comparing Explainable Reinforcement Learning Techniques","display_name":"XRL-Bench: A Benchmark for Evaluating and Comparing Explainable Reinforcement Learning Techniques","publication_year":2024,"publication_date":"2024-08-24","ids":{"openalex":"https://openalex.org/W4401857392","doi":"https://doi.org/10.1145/3637528.3671595"},"language":"en","primary_location":{"id":"doi:10.1145/3637528.3671595","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3637528.3671595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030275295","display_name":"Yu Xiong","orcid":"https://orcid.org/0000-0002-9656-6193"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yu Xiong","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101779299","display_name":"Zhipeng Hu","orcid":"https://orcid.org/0000-0003-4367-0816"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhipeng Hu","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102523917","display_name":"Huang Ye","orcid":"https://orcid.org/0000-0003-3336-0785"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Huang","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069512988","display_name":"Runze Wu","orcid":"https://orcid.org/0000-0002-6986-5825"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Runze Wu","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006918020","display_name":"Kai Guan","orcid":"https://orcid.org/0000-0003-3582-3464"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Guan","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082897780","display_name":"Xingchen Fang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"XingChen Fang","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005205575","display_name":"Ji Tong Jiang","orcid":"https://orcid.org/0000-0002-9632-8400"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ji Jiang","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008041973","display_name":"Tianze Zhou","orcid":"https://orcid.org/0000-0001-6375-5206"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianze Zhou","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018405065","display_name":"Yujing Hu","orcid":"https://orcid.org/0000-0002-2714-0092"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"YuJing Hu","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067320802","display_name":"Haoyu Liu","orcid":"https://orcid.org/0000-0002-8998-1217"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyu Liu","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112845879","display_name":"Tangjie Lyu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tangjie Lyu","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022008180","display_name":"Changjie Fan","orcid":"https://orcid.org/0000-0001-5420-0516"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changjie Fan","raw_affiliation_strings":["Fuxi AI Lab, NetEase Inc., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Fuxi AI Lab, NetEase Inc., Hangzhou, China","institution_ids":["https://openalex.org/I4210091137"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5030275295"],"corresponding_institution_ids":["https://openalex.org/I4210091137"],"apc_list":null,"apc_paid":null,"fwci":0.695,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.751855,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"6073","last_page":"6082"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9605000019073486,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.838902473449707},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7018222808837891},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6628586649894714},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.396994024515152},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.07547751069068909}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.838902473449707},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7018222808837891},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6628586649894714},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.396994024515152},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.07547751069068909},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3637528.3671595","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3637528.3671595","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W40975834","https://openalex.org/W1677182931","https://openalex.org/W1787224781","https://openalex.org/W2100171245","https://openalex.org/W2282821441","https://openalex.org/W2617547828","https://openalex.org/W2765566013","https://openalex.org/W2788403449","https://openalex.org/W2883535494","https://openalex.org/W2891830784","https://openalex.org/W2899455150","https://openalex.org/W2962843949","https://openalex.org/W2963672746","https://openalex.org/W2972122474","https://openalex.org/W2996061341","https://openalex.org/W2996896271","https://openalex.org/W2996988244","https://openalex.org/W2997560917","https://openalex.org/W2998004401","https://openalex.org/W3023586494","https://openalex.org/W3088310808","https://openalex.org/W3102824929","https://openalex.org/W3120778962","https://openalex.org/W3124922852","https://openalex.org/W3133543405","https://openalex.org/W3134840027","https://openalex.org/W3197200122","https://openalex.org/W3212249145","https://openalex.org/W4220970489","https://openalex.org/W4226313597","https://openalex.org/W4280578116","https://openalex.org/W4283396845","https://openalex.org/W4287278739","https://openalex.org/W4287906792"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W972276598","https://openalex.org/W2087343574"],"abstract_inverted_index":{"Reinforcement":[0],"Learning":[1],"(RL)":[2],"has":[3],"demonstrated":[4],"substantial":[5],"potential":[6],"across":[7],"diverse":[8],"fields,":[9],"yet":[10],"understanding":[11],"its":[12],"decision-making":[13],"process,":[14],"especially":[15],"in":[16,32,156],"real-world":[17,157],"scenarios":[18],"where":[19],"rationality":[20],"and":[21,93,109,126,133,145,161,171],"safety":[22],"are":[23],"paramount,":[24],"is":[25],"an":[26,70,143,163],"ongoing":[27],"challenge.":[28],"This":[29],"paper":[30],"delves":[31],"to":[33],"Explainable":[34,40],"RL":[35,49,119],"(XRL),":[36],"a":[37,57,84,101],"subfield":[38],"of":[39,48,83,90,111,154,173,182],"AI":[41],"(XAI)":[42],"aimed":[43],"at":[44,73],"unravelling":[45],"the":[46,66,81,107,151,168,179],"complexities":[47],"models.":[50],"Our":[51,176],"focus":[52],"rests":[53],"on":[54,123],"state-explaining":[55],"techniques,":[56],"crucial":[58],"subset":[59],"within":[60],"XRL":[61,112,147,174,183],"methods,":[62,113],"as":[63],"they":[64],"reveal":[65],"underlying":[67],"factors":[68],"influencing":[69],"agent's":[71],"actions":[72],"any":[74],"given":[75],"time.":[76],"Despite":[77],"their":[78,91],"significant":[79],"role,":[80],"lack":[82],"unified":[85,102],"evaluation":[86,108,172],"framework":[87],"hinders":[88],"assessment":[89],"accuracy":[92],"effectiveness.":[94],"To":[95],"address":[96],"this,":[97],"we":[98],"introduce":[99],"XRL-Bench,":[100],"standardized":[103],"benchmark":[104,165],"tailored":[105],"for":[106,136,167],"comparison":[110],"encompassing":[114],"three":[115],"main":[116],"modules:":[117],"standard":[118,127],"environments,":[120],"explainers":[121],"based":[122],"state":[124,137],"importance,":[125],"evaluators.":[128],"XRL-Bench":[129],"supports":[130],"both":[131],"tabular":[132],"image":[134],"data":[135],"explanation.":[138],"We":[139,149],"also":[140],"propose":[141],"TabularSHAP,":[142],"innovative":[144],"competitive":[146],"method.":[148],"demonstrate":[150],"practical":[152],"utility":[153],"TabularSHAP":[155],"online":[158],"gaming":[159],"services":[160],"offer":[162],"open-source":[164],"platform":[166],"straightforward":[169],"implementation":[170],"methods.":[175],"contributions":[177],"facilitate":[178],"continued":[180],"progression":[181],"technology.":[184]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
