{"id":"https://openalex.org/W7147370540","doi":"https://doi.org/10.48550/arxiv.2603.27403","title":"Conditional Factuality Controlled LLMs with Generalization Certificates via Conformal Sampling","display_name":"Conditional Factuality Controlled LLMs with Generalization Certificates via Conformal Sampling","publication_year":2026,"publication_date":"2026-03-28","ids":{"openalex":"https://openalex.org/W7147370540","doi":"https://doi.org/10.48550/arxiv.2603.27403"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27403","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132642863","display_name":"Kai Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Kai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003242041","display_name":"Qingtao Pan","orcid":"https://orcid.org/0000-0002-5247-9469"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Qingtao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132690717","display_name":"Shuo Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2734000086784363,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.2734000086784363,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.15600000321865082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.1371999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6840000152587891},{"id":"https://openalex.org/keywords/certificate","display_name":"Certificate","score":0.6377999782562256},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5945000052452087},{"id":"https://openalex.org/keywords/quantile","display_name":"Quantile","score":0.5766000151634216},{"id":"https://openalex.org/keywords/conformal-map","display_name":"Conformal map","score":0.5230000019073486},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.454800009727478},{"id":"https://openalex.org/keywords/conditional-expectation","display_name":"Conditional expectation","score":0.38940000534057617}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6840000152587891},{"id":"https://openalex.org/C96865113","wikidata":"https://www.wikidata.org/wiki/Q2946816","display_name":"Certificate","level":2,"score":0.6377999782562256},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5945000052452087},{"id":"https://openalex.org/C118671147","wikidata":"https://www.wikidata.org/wiki/Q578714","display_name":"Quantile","level":2,"score":0.5766000151634216},{"id":"https://openalex.org/C98214594","wikidata":"https://www.wikidata.org/wiki/Q850275","display_name":"Conformal map","level":2,"score":0.5230000019073486},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4722999930381775},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4715999960899353},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.454800009727478},{"id":"https://openalex.org/C186215838","wikidata":"https://www.wikidata.org/wiki/Q772232","display_name":"Conditional expectation","level":2,"score":0.38940000534057617},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3637999892234802},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.35499998927116394},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.34950000047683716},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.34130001068115234},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33820000290870667},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.33739998936653137},{"id":"https://openalex.org/C43555835","wikidata":"https://www.wikidata.org/wiki/Q2300258","display_name":"Conditional probability distribution","level":2,"score":0.3361999988555908},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31369999051094055},{"id":"https://openalex.org/C44492722","wikidata":"https://www.wikidata.org/wiki/Q327069","display_name":"Conditional probability","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28949999809265137},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2883000075817108},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.26969999074935913},{"id":"https://openalex.org/C161584116","wikidata":"https://www.wikidata.org/wiki/Q1952580","display_name":"Multivariate statistics","level":2,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"need":[4],"reliable":[5],"test-time":[6],"control":[7],"of":[8],"hallucinations.":[9],"Existing":[10],"conformal":[11,48,119],"methods":[12],"for":[13],"LLMs":[14],"typically":[15],"provide":[16],"only":[17],"\\emph{marginal}":[18],"guarantees":[19],"and":[20,35,74,97,166,169,175,191],"rely":[21],"on":[22,69,106,140,161],"a":[23,46,60,70,78,91,129,141,145,170],"single":[24],"global":[25],"threshold,":[26],"which":[27,133],"can":[28],"under-cover":[29],"hard":[30],"prompts,":[31],"over-cover":[32],"easy":[33],"ones,":[34],"produce":[36],"oversized":[37],"prediction":[38,120,187],"sets.":[39],"We":[40,126],"propose":[41],"\\emph{Conditional":[42],"Factuality":[43],"Control}":[44],"(CFC),":[45],"post-hoc":[47],"framework":[49],"that":[50,88,148],"returns":[51],"\\emph{set-valued}":[52],"outputs":[53],"with":[54],"\\emph{conditional}":[55],"coverage":[56,93,180],"guarantees.":[57],"CFC":[58,89,174],"defines":[59],"continuous,":[61],"feature-conditional":[62],"acceptance":[63],"threshold":[64,80],"through":[65,77],"augmented":[66],"quantile":[67],"regression":[68],"latent":[71],"``success''":[72],"score,":[73],"deploys":[75],"it":[76],"fixed-point":[79],"rule":[81,112],"at":[82,121,157],"inference":[83],"time.":[84],"Theoretically,":[85],"we":[86],"show":[87],"satisfies":[90],"conditional":[92,111,150],"guarantee":[94],"under":[95,103],"exchangeability":[96],"analyze":[98],"its":[99],"\\emph{efficiency},":[100],"proving":[101],"that,":[102],"mild":[104],"assumptions":[105],"the":[107,110,122,135,149,154],"score":[108],"distributions,":[109],"is":[113],"strictly":[114],"more":[115],"sample-efficient":[116],"than":[117,189],"marginal":[118],"same":[123],"target":[124,155],"coverage.":[125],"further":[127],"derive":[128],"PAC-style":[130],"variant,":[131],"CFC-PAC,":[132],"shrinks":[134],"nominal":[136],"risk":[137],"level":[138],"based":[139],"stability":[142],"bound,":[143],"yielding":[144],"finite-sample":[146],"certificate":[147],"miscoverage":[151],"deviates":[152],"from":[153],"by":[156],"most":[158],"$O(\\sqrt{\\log(1/\u03b4)/N})$.":[159],"Empirically,":[160],"synthetic":[162],"data,":[163],"real-world":[164],"reasoning":[165],"QA":[167],"benchmarks,":[168],"Flickr8k":[171],"VLM":[172],"setting,":[173],"CFC-PAC":[176],"consistently":[177],"attain":[178],"near-target":[179],"across":[181],"difficulty":[182],"groups":[183],"while":[184],"using":[185],"smaller":[186],"sets":[188],"CP":[190],"non-CP":[192],"baselines.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-02T00:00:00"}
