{"id":"https://openalex.org/W7127116451","doi":"https://doi.org/10.48550/arxiv.2601.23133","title":"RAudit: A Blind Auditing Protocol for Large Language Model Reasoning","display_name":"RAudit: A Blind Auditing Protocol for Large Language Model Reasoning","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7127116451","doi":"https://doi.org/10.48550/arxiv.2601.23133"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2601.23133","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124856665","display_name":"Edward Y. Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chang, Edward Y.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5124865968","display_name":"Longling Geng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Geng, Longling","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5124856665"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2994999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2994999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.195700004696846,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.050200000405311584,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/competence","display_name":"Competence (human resources)","score":0.6251999735832214},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.5627999901771545},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.4577000141143799},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.41600000858306885},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.3885999917984009},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.3682999908924103},{"id":"https://openalex.org/keywords/mathematical-proof","display_name":"Mathematical proof","score":0.35019999742507935},{"id":"https://openalex.org/keywords/framing-effect","display_name":"Framing effect","score":0.3456999957561493}],"concepts":[{"id":"https://openalex.org/C100521375","wikidata":"https://www.wikidata.org/wiki/Q2015382","display_name":"Competence (human resources)","level":2,"score":0.6251999735832214},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5695000290870667},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.5627999901771545},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.4577000141143799},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.44920000433921814},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.41600000858306885},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4050999879837036},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.38940000534057617},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3885999917984009},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C108710211","wikidata":"https://www.wikidata.org/wiki/Q11538","display_name":"Mathematical proof","level":2,"score":0.35019999742507935},{"id":"https://openalex.org/C136714292","wikidata":"https://www.wikidata.org/wiki/Q1440683","display_name":"Framing effect","level":3,"score":0.3456999957561493},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.33809998631477356},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3230000138282776},{"id":"https://openalex.org/C133112747","wikidata":"https://www.wikidata.org/wiki/Q7251931","display_name":"Protocol analysis","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31119999289512634},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C25148115","wikidata":"https://www.wikidata.org/wiki/Q304904","display_name":"Social competence","level":3,"score":0.26030001044273376},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C2775907273","wikidata":"https://www.wikidata.org/wiki/Q7805281","display_name":"Time constraint","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.25220000743865967},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2601.23133","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2601.23133","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.23133","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2601.23133","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Inference-time":[0],"scaling":[1],"can":[2],"amplify":[3],"reasoning":[4,21,82],"pathologies:":[5],"sycophancy,":[6],"rung":[7],"collapse,":[8],"and":[9,60,76,84,140,158],"premature":[10],"certainty.":[11],"We":[12,72],"present":[13],"RAudit,":[14],"a":[15],"diagnostic":[16],"protocol":[17],"for":[18],"auditing":[19],"LLM":[20],"without":[22],"ground":[23],"truth":[24],"access.":[25],"The":[26,110,124],"key":[27],"constraint":[28],"is":[29],"blindness:":[30],"the":[31],"auditor":[32],"evaluates":[33],"only":[34],"whether":[35],"derivation":[36],"steps":[37],"support":[38],"conclusions,":[39],"enabling":[40],"detection":[41],"of":[42],"trace-output":[43],"inconsistency":[44],"and,":[45],"when":[46],"latent":[47],"competence":[48],"exists,":[49],"its":[50],"recovery.":[51],"RAudit":[52],"measures":[53],"process":[54],"quality":[55],"via":[56],"CRIT-based":[57],"reasonableness":[58],"scores":[59],"varies":[61],"critique":[62],"formulation":[63],"to":[64],"study":[65],"how":[66],"social":[67,107],"framing":[68],"affects":[69],"model":[70,92],"response.":[71],"prove":[73],"bounded":[74],"correction":[75,146],"$O(\\log(1/\u03b5))$":[77],"termination.":[78],"Experiments":[79],"on":[80],"mathematical":[81,138],"(CAP-GSM8K)":[83],"causal":[85,128],"judgment":[86],"(CausalL2)":[87],"reveal":[88],"four":[89],"mechanisms":[90],"explaining":[91],"unreliability:":[93],"(1)":[94],"Latent":[95],"Competence":[96,112],"Suppression,":[97],"where":[98,114,127,144],"models":[99],"derive":[100],"correct":[101],"answers":[102],"then":[103],"overwrite":[104],"them":[105],"under":[106],"pressure;":[108],"(2)":[109],"False":[111],"Trap,":[113],"weaker":[115,148],"judges":[116,121],"mask":[117],"sycophancy":[118,136],"that":[119,154,159],"stronger":[120,160],"expose;":[122],"(3)":[123],"Complexity-Vulnerability":[125],"Tradeoff,":[126],"tasks":[129],"induce":[130],"more":[131],"than":[132,137],"10":[133],"times":[134],"higher":[135],"tasks;":[139],"(4)":[141],"Iatrogenic":[142],"Critique,":[143],"authoritative":[145],"harms":[147],"models.":[149],"These":[150],"findings":[151],"challenge":[152],"assumptions":[153],"capability":[155],"implies":[156],"robustness":[157],"feedback":[161],"yields":[162],"better":[163],"outputs.":[164]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-03T00:00:00"}
