{"id":"https://openalex.org/W7161760015","doi":"https://doi.org/10.48550/arxiv.2605.20084","title":"BalanceRAG: Joint Risk Calibration for Cascaded Retrieval-Augmented Generation","display_name":"BalanceRAG: Joint Risk Calibration for Cascaded Retrieval-Augmented Generation","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7161760015","doi":"https://doi.org/10.48550/arxiv.2605.20084"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.20084","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20084","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.20084","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136611457","display_name":"Zijun Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Zijun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136508476","display_name":"Yuanchang Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Yuanchang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136594831","display_name":"Sen Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Sen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050585744","display_name":"Yiyao Qian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qian, Yiyao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064258138","display_name":"H. Q. Wang","orcid":"https://orcid.org/0009-0005-0307-1853"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haoning","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136511835","display_name":"Baojie Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Baojie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108643233","display_name":"Tang Diyin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Diyin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026534062","display_name":"Jinsong Yu","orcid":"https://orcid.org/0000-0002-1998-6995"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jinsong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136557780","display_name":"Zhiyuan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhiyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9020000100135803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9020000100135803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.040800001472234726,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.00559999980032444,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/thresholding","display_name":"Thresholding","score":0.6718999743461609},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.519599974155426},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.5087000131607056},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.4668000042438507},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.46230000257492065},{"id":"https://openalex.org/keywords/graphical-display","display_name":"Graphical display","score":0.3296000063419342}],"concepts":[{"id":"https://openalex.org/C191178318","wikidata":"https://www.wikidata.org/wiki/Q2256906","display_name":"Thresholding","level":3,"score":0.6718999743461609},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6460000276565552},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.519599974155426},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.5087000131607056},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.4668000042438507},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4546999931335449},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3499999940395355},{"id":"https://openalex.org/C2984927552","wikidata":"https://www.wikidata.org/wiki/Q845734","display_name":"Graphical display","level":2,"score":0.3296000063419342},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.2687999904155731}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.20084","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20084","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.20084","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20084","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"can":[4],"enhance":[5],"factuality":[6],"via":[7],"retrieval-augmented":[8],"generation":[9],"(RAG),":[10],"but":[11],"applying":[12],"RAG":[13,41],"to":[14,39,88,146,152],"every":[15],"query":[16,30],"is":[17,23,31,48,56],"unnecessary":[18,189],"when":[19,53],"the":[20,45,70,101,132,157],"model-only":[21],"answer":[22],"reliable.":[24],"This":[25,126],"motivates":[26],"cascaded":[27],"RAG:":[28],"each":[29,106],"first":[32],"handled":[33],"by":[34,64],"an":[35,110],"LLM-only":[36,79],"branch,":[37],"escalated":[38],"a":[40,93,114],"fallback":[42],"only":[43],"if":[44],"primary":[46],"branch":[47,55],"uncertain,":[49],"and":[50,80,117,182,187],"abstained":[51],"from":[52,100],"neither":[54],"sufficiently":[57],"trustworthy.":[58],"However,":[59],"calibrating":[60],"such":[61],"cascades":[62],"stage":[63,65],"may":[66],"be":[67,153],"conservative,":[68],"since":[69],"final":[71],"utility":[72],"depends":[73],"on":[74,113,161],"joint":[75],"uncertainty":[76,98],"thresholding":[77],"of":[78],"RAG.":[81,195],"In":[82],"this":[83],"work,":[84],"we":[85],"develop":[86],"BalanceRAG":[87,104,144,174],"certify":[89],"threshold":[90,107,129],"pairs":[91],"at":[92],"target":[94],"risk":[95,177],"level.":[96],"Given":[97],"scores":[99],"two":[102],"branches,":[103],"frames":[105],"pair":[108],"as":[109],"operating":[111,120],"point":[112],"two-dimensional":[115],"lattice":[116],"identifies":[118],"safe":[119],"points":[121],"using":[122],"sequential":[123],"graphical":[124],"testing.":[125],"enables":[127],"risk-adaptive":[128],"calibration,":[130,148],"controlling":[131],"system-level":[133],"error":[134],"rate":[135],"among":[136],"accepted":[137,184],"points,":[138],"while":[139],"retaining":[140],"more":[141,183],"examples.":[142],"Furthermore,":[143],"extends":[145],"multi-risk":[147],"allowing":[149],"retrieval":[150,190],"usage":[151],"bounded":[154],"together":[155],"with":[156,193],"selection-conditioned":[158],"risk.":[159],"Experiments":[160],"three":[162],"open-domain":[163],"question":[164],"answering":[165],"(QA)":[166],"benchmarks":[167],"across":[168],"multiple":[169],"LLM":[170],"backbones":[171],"demonstrate":[172],"that":[173],"meets":[175],"prescribed":[176],"levels,":[178],"preserves":[179],"higher":[180],"coverage":[181],"correct":[185],"examples,":[186],"reduces":[188],"calls":[191],"compared":[192],"always-on":[194]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-21T00:00:00"}
