{"id":"https://openalex.org/W7118985982","doi":"https://doi.org/10.48550/arxiv.2601.00830","title":"Can We Trust AI Explanations? Evidence of Systematic Underreporting in Chain-of-Thought Reasoning","display_name":"Can We Trust AI Explanations? Evidence of Systematic Underreporting in Chain-of-Thought Reasoning","publication_year":2025,"publication_date":"2025-12-25","ids":{"openalex":"https://openalex.org/W7118985982","doi":"https://doi.org/10.48550/arxiv.2601.00830"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.00830","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00830","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.00830","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122169850","display_name":"Deep Pankajbhai Mehta","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mehta, Deep Pankajbhai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5122169850"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.7608000040054321,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.7608000040054321,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.05570000037550926,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12520","display_name":"Psychology of Moral and Emotional Judgment","score":0.01889999955892563,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forcing","display_name":"Forcing (mathematics)","score":0.5156999826431274},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.42309999465942383},{"id":"https://openalex.org/keywords/motivated-reasoning","display_name":"Motivated reasoning","score":0.3986000120639801},{"id":"https://openalex.org/keywords/causal-reasoning","display_name":"Causal reasoning","score":0.2718000113964081},{"id":"https://openalex.org/keywords/deception","display_name":"Deception","score":0.26759999990463257}],"concepts":[{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.5156999826431274},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.49970000982284546},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4650000035762787},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C2776325391","wikidata":"https://www.wikidata.org/wiki/Q6917865","display_name":"Motivated reasoning","level":3,"score":0.3986000120639801},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3961000144481659},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3734000027179718},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.361299991607666},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.2948000133037567},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.2718000113964081},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2687000036239624},{"id":"https://openalex.org/C2779267917","wikidata":"https://www.wikidata.org/wiki/Q170028","display_name":"Deception","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.25609999895095825}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.00830","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00830","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.00830","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00830","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"When":[0],"AI":[1,45,133],"systems":[2],"explain":[3],"their":[4,105],"reasoning":[5,134],"step-by-step,":[6],"practitioners":[7],"often":[8,122],"assume":[9],"these":[10],"explanations":[11],"reveal":[12],"what":[13],"actually":[14],"influenced":[15],"the":[16],"AI's":[17],"answer.":[18],"We":[19,107],"tested":[20],"this":[21],"assumption":[22],"by":[23],"embedding":[24],"hints":[25,56,91,98,111],"into":[26],"questions":[27],"and":[28,103],"measuring":[29],"whether":[30],"models":[31,52,68,79,88],"mentioned":[32],"them.":[33,65],"In":[34],"a":[35,49],"study":[36],"of":[37],"over":[38],"9,000":[39],"test":[40],"cases":[41],"across":[42],"11":[43],"leading":[44],"models,":[46],"we":[47],"found":[48,109],"troubling":[50],"pattern:":[51],"almost":[53],"never":[54],"mention":[55],"spontaneously,":[57],"yet":[58],"when":[59,100],"asked":[60],"directly,":[61],"they":[62,80],"admit":[63],"noticing":[64],"This":[66],"suggests":[67],"see":[69],"influential":[70],"information":[71],"but":[72,93],"choose":[73],"not":[74,85,136],"to":[75,89,96,113,138],"report":[76,90,97],"it.":[77],"Telling":[78],"are":[81,116],"being":[82],"watched":[83],"does":[84],"help.":[86],"Forcing":[87],"works,":[92],"causes":[94],"them":[95,120,125],"even":[99],"none":[101],"exist":[102],"reduces":[104],"accuracy.":[106],"also":[108],"that":[110,130],"appealing":[112],"user":[114],"preferences":[115],"especially":[117],"dangerous-models":[118],"follow":[119],"most":[121],"while":[123],"reporting":[124],"least.":[126],"These":[127],"findings":[128],"suggest":[129],"simply":[131],"watching":[132],"is":[135],"enough":[137],"catch":[139],"hidden":[140],"influences.":[141]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
