{"id":"https://openalex.org/W7155793825","doi":"https://doi.org/10.48550/arxiv.2604.22662","title":"Rethinking XAI Evaluation: A Human-Centered Audit of Shapley Benchmarks in High-Stakes Settings","display_name":"Rethinking XAI Evaluation: A Human-Centered Audit of Shapley Benchmarks in High-Stakes Settings","publication_year":2026,"publication_date":"2026-04-24","ids":{"openalex":"https://openalex.org/W7155793825","doi":"https://doi.org/10.48550/arxiv.2604.22662"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.22662","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22662","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.22662","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086695956","display_name":"I. Oliveira e Silva","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Silva, In\u00eas Oliveira e","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134695500","display_name":"S\u00e9rgio Jesus","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jesus, S\u00e9rgio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049110696","display_name":"Iker Perez","orcid":"https://orcid.org/0000-0001-9400-4229"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Perez, Iker","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085639693","display_name":"Rita P. Ribeiro","orcid":"https://orcid.org/0000-0002-6852-8077"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ribeiro, Rita P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124224435","display_name":"Carlos Soares","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Soares, Carlos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134672507","display_name":"Hugo Ferreira","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ferreira, Hugo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077752651","display_name":"Pedro Bizarro","orcid":"https://orcid.org/0000-0001-5281-1970"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bizarro, Pedro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5086695956"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.5292999744415283,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.5292999744415283,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.2856999933719635,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.07540000230073929,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/clarity","display_name":"CLARITY","score":0.785099983215332},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.5054000020027161},{"id":"https://openalex.org/keywords/cornerstone","display_name":"Cornerstone","score":0.4388999938964844},{"id":"https://openalex.org/keywords/shapley-value","display_name":"Shapley value","score":0.36000001430511475},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.3334999978542328},{"id":"https://openalex.org/keywords/decision-analysis","display_name":"Decision analysis","score":0.29919999837875366}],"concepts":[{"id":"https://openalex.org/C2777146004","wikidata":"https://www.wikidata.org/wiki/Q14949826","display_name":"CLARITY","level":2,"score":0.785099983215332},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5270000100135803},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.5054000020027161},{"id":"https://openalex.org/C2780616401","wikidata":"https://www.wikidata.org/wiki/Q1133673","display_name":"Cornerstone","level":2,"score":0.4388999938964844},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3955000042915344},{"id":"https://openalex.org/C162118730","wikidata":"https://www.wikidata.org/wiki/Q1128453","display_name":"Actuarial science","level":1,"score":0.36250001192092896},{"id":"https://openalex.org/C199022921","wikidata":"https://www.wikidata.org/wiki/Q240046","display_name":"Shapley value","level":3,"score":0.36000001430511475},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3005000054836273},{"id":"https://openalex.org/C186116695","wikidata":"https://www.wikidata.org/wiki/Q5249226","display_name":"Decision analysis","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.29440000653266907},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C11105738","wikidata":"https://www.wikidata.org/wiki/Q1895805","display_name":"Multiple-criteria decision analysis","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.2904999852180481},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.28130000829696655},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C107327155","wikidata":"https://www.wikidata.org/wiki/Q330268","display_name":"Decision support system","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2612000107765198}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.22662","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22662","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.22662","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22662","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8204560279846191,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Shapley":[0,58],"values":[1],"are":[2,28,104,142],"a":[3,16,48,70,79,93,126],"cornerstone":[4],"of":[5,64,129],"explainable":[6],"AI,":[7],"yet":[8],"their":[9],"proliferation":[10],"into":[11],"competing":[12],"formulations":[13,156],"has":[14],"created":[15],"fragmented":[17],"landscape":[18],"with":[19,38],"little":[20],"consensus":[21],"on":[22,33],"practical":[23],"deployment.":[24],"While":[25],"theoretical":[26],"differences":[27,55],"well-documented,":[29],"evaluation":[30,73,140],"remains":[31],"reliant":[32],"quantitative":[34,97],"proxies":[35,141],"whose":[36],"alignment":[37],"human":[39,147],"utility":[40],"is":[41],"unverified.":[42],"In":[43],"this":[44],"work,":[45],"we":[46,150],"use":[47],"unified":[49],"amortized":[50],"framework":[51],"to":[52],"isolate":[53],"semantic":[54],"between":[56],"eight":[57],"variants":[59],"under":[60],"the":[61],"low-latency":[62],"constraints":[63],"operational":[65,160],"risk":[66,76,128],"workflows.":[67],"We":[68],"conduct":[69],"large-scale":[71],"empirical":[72],"across":[74],"four":[75],"datasets":[77],"and":[78,86,102,109,149,157],"realistic":[80],"fraud-detection":[81],"environment":[82],"involving":[83],"professional":[84],"analysts":[85],"3,735":[87],"case":[88],"reviews.":[89],"Our":[90],"results":[91],"reveal":[92],"fundamental":[94],"misalignment:":[95],"standard":[96],"metrics,":[98],"such":[99],"as":[100],"sparsity":[101],"faithfulness,":[103],"decoupled":[105],"from":[106],"human-perceived":[107],"clarity":[108],"decision":[110,123,161],"utility.":[111],"Furthermore,":[112],"while":[113],"no":[114],"formulation":[115],"improved":[116],"objective":[117],"analyst":[118],"performance,":[119],"explanations":[120],"consistently":[121],"increased":[122],"confidence,":[124],"signaling":[125],"critical":[127],"automation":[130],"bias":[131],"in":[132,159],"high-stakes":[133],"settings.":[134],"These":[135],"findings":[136],"suggest":[137],"that":[138],"current":[139],"insufficient":[143],"for":[144,154],"predicting":[145],"downstream":[146],"impact,":[148],"provide":[151],"evidence-based":[152],"guidance":[153],"selecting":[155],"metrics":[158],"systems.":[162]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-28T00:00:00"}
