{"id":"https://openalex.org/W7152605534","doi":"https://doi.org/10.48550/arxiv.2604.07036","title":"ReDAct: Uncertainty-Aware Deferral for LLM Agents","display_name":"ReDAct: Uncertainty-Aware Deferral for LLM Agents","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7152605534","doi":"https://doi.org/10.48550/arxiv.2604.07036"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07036","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133264365","display_name":"Dzianis Piatrashyn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Piatrashyn, Dzianis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070122910","display_name":"Nikita Kotelevskii","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kotelevskii, Nikita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117017643","display_name":"Kirill Grishchenkov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Grishchenkov, Kirill","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133272379","display_name":"Nikita Glazkov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glazkov, Nikita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133289054","display_name":"Ivan Nasonov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nasonov, Ivan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074238659","display_name":"Ilya Makarov","orcid":"https://orcid.org/0000-0002-3308-8825"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Makarov, Ilya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133295396","display_name":"Timothy Baldwin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baldwin, Timothy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133246428","display_name":"Preslav Nakov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakov, Preslav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046928528","display_name":"Roman Vashurin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vashurin, Roman","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133305861","display_name":"Maxim Panov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Panov, Maxim","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.6086999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.6086999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.04560000076889992,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.03220000118017197,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/deferral","display_name":"Deferral","score":0.675000011920929},{"id":"https://openalex.org/keywords/mistake","display_name":"Mistake","score":0.6251999735832214},{"id":"https://openalex.org/keywords/hallucinating","display_name":"Hallucinating","score":0.5353999733924866},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5249000191688538},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.42669999599456787}],"concepts":[{"id":"https://openalex.org/C2778281098","wikidata":"https://www.wikidata.org/wiki/Q885383","display_name":"Deferral","level":2,"score":0.675000011920929},{"id":"https://openalex.org/C2777179996","wikidata":"https://www.wikidata.org/wiki/Q911222","display_name":"Mistake","level":2,"score":0.6251999735832214},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.5353999733924866},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5249000191688538},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.4957999885082245},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.42669999599456787},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.41990000009536743},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.4147000014781952},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.4041000008583069},{"id":"https://openalex.org/C162118730","wikidata":"https://www.wikidata.org/wiki/Q1128453","display_name":"Actuarial science","level":1,"score":0.33559998869895935},{"id":"https://openalex.org/C195487862","wikidata":"https://www.wikidata.org/wiki/Q850210","display_name":"Revenue","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.2799000144004822},{"id":"https://openalex.org/C177713679","wikidata":"https://www.wikidata.org/wiki/Q679690","display_name":"Intensive care medicine","level":1,"score":0.26649999618530273},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8245317339897156,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recently,":[0],"LLM-based":[1],"agents":[2],"have":[3],"become":[4],"increasingly":[5],"popular":[6],"across":[7],"many":[8],"applications,":[9],"including":[10],"complex":[11],"sequential":[12,29],"decision-making":[13],"problems.":[14],"However,":[15],"they":[16,51],"inherit":[17],"the":[18,38,94,98,105,110,136,141],"tendency":[19],"of":[20,97,133,143],"LLMs":[21,48],"to":[22,25,109,135],"hallucinate,":[23],"leading":[24],"incorrect":[26],"decisions.":[27],"In":[28,58,69],"settings,":[30],"even":[31,43],"a":[32,53,78,86,102],"single":[33],"mistake":[34],"can":[35,139],"irreversibly":[36],"degrade":[37],"trajectory,":[39],"making":[40],"hallucinations":[41],"an":[42,71],"bigger":[44],"problem.":[45],"Although":[46],"larger":[47],"hallucinate":[49],"less,":[50],"incur":[52],"significantly":[54,148],"higher":[55],"per-token":[56],"cost.":[57],"this":[59,63],"paper,":[60],"we":[61],"address":[62],"tradeoff":[64],"by":[65,83],"proposing":[66],"ReDAct":[67],"(Reason-Defer-Act).":[68],"ReDAct,":[70],"agent":[72],"is":[73,107],"equipped":[74],"with":[75],"two":[76],"LLMs:":[77],"small,":[79],"cheap":[80],"model":[81,100,138],"used":[82],"default,":[84],"and":[85,124,126],"large,":[87],"more":[88],"reliable":[89],"but":[90],"expensive":[91],"model.":[92,112],"When":[93],"predictive":[95],"uncertainty":[96],"small":[99],"exceeds":[101],"calibrated":[103],"threshold,":[104],"decision":[106],"deferred":[108],"large":[111,137],"We":[113],"evaluate":[114],"our":[115],"approach":[116],"in":[117],"text-based":[118],"embodied":[119],"environments":[120],"such":[121],"as":[122],"ALFWorld":[123],"MiniGrid":[125],"show":[127],"that":[128],"deferring":[129],"only":[130],"about":[131],"15%":[132],"decisions":[134],"match":[140],"quality":[142],"using":[144],"it":[145],"exclusively,":[146],"while":[147],"reducing":[149],"inference":[150],"costs.":[151]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-10T00:00:00"}
