{"id":"https://openalex.org/W4383176552","doi":"https://doi.org/10.48550/arxiv.2307.00897","title":"Fixing confirmation bias in feature attribution methods via semantic match","display_name":"Fixing confirmation bias in feature attribution methods via semantic match","publication_year":2023,"publication_date":"2023-07-03","ids":{"openalex":"https://openalex.org/W4383176552","doi":"https://doi.org/10.48550/arxiv.2307.00897"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2307.00897","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.00897","pdf_url":"https://arxiv.org/pdf/2307.00897","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2307.00897","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044955303","display_name":"Giovanni Cin\u00e0","orcid":"https://orcid.org/0000-0002-3521-8208"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Cin\u00e0, Giovanni","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024112893","display_name":"Daniel Fern\u00e1ndez-Llaneza","orcid":"https://orcid.org/0000-0002-2770-4214"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fernandez-Llaneza, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Deponte, Ludovico","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deponte, Ludovico","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075790745","display_name":"Nishant Mishra","orcid":"https://orcid.org/0000-0002-0946-6048"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Nishant","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019285489","display_name":"Tabea E. R\u00f6ber","orcid":"https://orcid.org/0009-0005-7089-5924"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"R\u00f6ber, Tabea E.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007142536","display_name":"Sandro Pezzelle","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pezzelle, Sandro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086777036","display_name":"Iacer Calixto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Calixto, Iacer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044989654","display_name":"Rob Goedhart","orcid":"https://orcid.org/0000-0001-9966-0284"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goedhart, Rob","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5087647617","display_name":"\u015e. \u0130lker Birbil","orcid":"https://orcid.org/0000-0001-7472-7032"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Birbil, \u015e. \u0130lker","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5044955303"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9811000227928162,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spurious-relationship","display_name":"Spurious relationship","score":0.7851881384849548},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7165348529815674},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6799703240394592},{"id":"https://openalex.org/keywords/attribution","display_name":"Attribution","score":0.5532823204994202},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.530360758304596},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.48683470487594604},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.48318663239479065},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.48216742277145386},{"id":"https://openalex.org/keywords/interpretation","display_name":"Interpretation (philosophy)","score":0.4674091637134552},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.44443055987358093},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.4356839060783386},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37580448389053345},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36083120107650757},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3124167323112488},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.19537058472633362},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.12821853160858154},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10581496357917786}],"concepts":[{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.7851881384849548},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7165348529815674},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6799703240394592},{"id":"https://openalex.org/C143299363","wikidata":"https://www.wikidata.org/wiki/Q900584","display_name":"Attribution","level":2,"score":0.5532823204994202},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.530360758304596},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48683470487594604},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.48318663239479065},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.48216742277145386},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.4674091637134552},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.44443055987358093},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.4356839060783386},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37580448389053345},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36083120107650757},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3124167323112488},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.19537058472633362},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.12821853160858154},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10581496357917786},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2307.00897","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.00897","pdf_url":"https://arxiv.org/pdf/2307.00897","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:pure.amsterdamumc.nl:openaire_cris_publications/6c75a82d-400a-4c84-a4dd-a32c93d16ecf","is_oa":true,"landing_page_url":"https://pure.amsterdamumc.nl/en/publications/6c75a82d-400a-4c84-a4dd-a32c93d16ecf","pdf_url":"https://pure.amsterdamumc.nl/files/109878031/2307.00897v1.pdf","source":{"id":"https://openalex.org/S7407055222","display_name":"Pure Amsterdam UMC","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Cin\u00e0, G, Fernandez-Llaneza, D, Mishra, N, R\u00f6ber, T E, Pezzelle, S, Calixto, I, Goedhart, R & Birbil, \u015e \u0130 2023 'Fixing confirmation bias in feature attribution methods via semantic match'.","raw_type":"info:eu-repo/semantics/preprint"},{"id":"doi:10.48550/arxiv.2307.00897","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2307.00897","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2307.00897","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.00897","pdf_url":"https://arxiv.org/pdf/2307.00897","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.6200000047683716,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4383176552.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3113091479","https://openalex.org/W2162899405","https://openalex.org/W941090075","https://openalex.org/W2044987316","https://openalex.org/W3134374554","https://openalex.org/W2237480245","https://openalex.org/W2103835134","https://openalex.org/W4238802473","https://openalex.org/W2034503175","https://openalex.org/W2036755558"],"abstract_inverted_index":{"Feature":[0],"attribution":[1],"methods":[2,26],"have":[3,22],"become":[4],"a":[5,29,36,61,80,127,141,179],"staple":[6],"method":[7],"to":[8,57,85,130,193],"disentangle":[9],"the":[10,91,96,104,115,138,153,191,203,208],"complex":[11],"behavior":[12],"of":[13,41,49,143,155,210],"black":[14],"box":[15],"models.":[16],"Despite":[17],"their":[18],"success,":[19],"some":[20],"scholars":[21],"argued":[23],"that":[24,79,199],"such":[25],"suffer":[27],"from":[28],"serious":[30],"flaw:":[31],"they":[32],"do":[33],"not":[34,53],"allow":[35],"reliable":[37],"interpretation":[38],"in":[39,120,134,140,213],"terms":[40],"human":[42,108],"concepts.":[43],"Simply":[44],"put,":[45],"visualizing":[46],"an":[47,167,188],"array":[48],"feature":[50,97],"contributions":[51],"is":[52,83,100],"enough":[54],"for":[55,170],"humans":[56],"conclude":[58],"something":[59],"about":[60,74],"model's":[62],"internal":[63],"representations,":[64],"and":[65,110,147,150,172,197],"confirmation":[66,211],"bias":[67,212],"can":[68,158],"trick":[69],"users":[70],"into":[71,161],"false":[72],"beliefs":[73],"model":[75,92,174],"behavior.":[76],"We":[77,136,182],"argue":[78,198],"structured":[81,128],"approach":[82,129,201],"required":[84],"test":[86],"whether":[87],"our":[88,184],"hypotheses":[89],"on":[90,114,166,178,190],"are":[93],"confirmed":[94],"by":[95],"attributions.":[98],"This":[99],"what":[101],"we":[102,125],"call":[103],"\"semantic":[105],"match\"":[106],"between":[107],"concepts":[109],"(sub-symbolic)":[111],"explanations.":[112],"Building":[113],"conceptual":[116],"framework":[117],"put":[118],"forward":[119],"Cin\u00e0":[121],"et":[122],"al.":[123],"[2023],":[124],"propose":[126],"evaluate":[131],"semantic":[132,156,195],"match":[133,157],"practice.":[135],"showcase":[137],"procedure":[139],"suite":[142],"experiments":[144],"spanning":[145],"tabular":[146],"image":[148],"data,":[149],"show":[151],"how":[152],"assessment":[154],"give":[159],"insight":[160],"both":[162],"desirable":[163],"(e.g.,":[164,176],"focusing":[165,177],"object":[168],"relevant":[169],"prediction)":[171],"undesirable":[173],"behaviors":[175],"spurious":[180],"correlation).":[181],"couple":[183],"experimental":[185],"results":[186],"with":[187],"analysis":[189],"metrics":[192],"measure":[194],"match,":[196],"this":[200],"constitutes":[202],"first":[204],"step":[205],"towards":[206],"resolving":[207],"issue":[209],"XAI.":[214]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-13T08:25:38.343686","created_date":"2023-07-05T00:00:00"}
