{"id":"https://openalex.org/W7161864463","doi":"https://doi.org/10.48550/arxiv.2605.18812","title":"PASC: Pipeline-Aware Conformal Prediction with Joint Coverage Guarantees for Multi-Stage NLP and LLM Pipelines","display_name":"PASC: Pipeline-Aware Conformal Prediction with Joint Coverage Guarantees for Multi-Stage NLP and LLM Pipelines","publication_year":2026,"publication_date":"2026-05-12","ids":{"openalex":"https://openalex.org/W7161864463","doi":"https://doi.org/10.48550/arxiv.2605.18812"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.18812","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18812","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.18812","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095886522","display_name":"Varun Kotte","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kotte, Varun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":["https://openalex.org/A5095886522"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7781999707221985,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7781999707221985,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.061000000685453415,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.03229999914765358,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5853000283241272},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.527400016784668},{"id":"https://openalex.org/keywords/quantile","display_name":"Quantile","score":0.4779999852180481},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.47699999809265137},{"id":"https://openalex.org/keywords/joint-probability-distribution","display_name":"Joint probability distribution","score":0.47099998593330383},{"id":"https://openalex.org/keywords/bonferroni-correction","display_name":"Bonferroni correction","score":0.38679999113082886},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.3589000105857849},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.32440000772476196},{"id":"https://openalex.org/keywords/dice","display_name":"Dice","score":0.32100000977516174}],"concepts":[{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5853000283241272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5314000248908997},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.527400016784668},{"id":"https://openalex.org/C118671147","wikidata":"https://www.wikidata.org/wiki/Q578714","display_name":"Quantile","level":2,"score":0.4779999852180481},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.47699999809265137},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.47099998593330383},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4643999934196472},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39590001106262207},{"id":"https://openalex.org/C127808970","wikidata":"https://www.wikidata.org/wiki/Q385989","display_name":"Bonferroni correction","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.3589000105857849},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35030001401901245},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C22029948","wikidata":"https://www.wikidata.org/wiki/Q45089","display_name":"Dice","level":2,"score":0.32100000977516174},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.31459999084472656},{"id":"https://openalex.org/C203519979","wikidata":"https://www.wikidata.org/wiki/Q865360","display_name":"Jaccard index","level":3,"score":0.31349998712539673},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.3131999969482422},{"id":"https://openalex.org/C178621042","wikidata":"https://www.wikidata.org/wiki/Q7631710","display_name":"Submodular set function","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.30649998784065247},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C2778220771","wikidata":"https://www.wikidata.org/wiki/Q1522579","display_name":"Substitution (logic)","level":2,"score":0.2939000129699707},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2921000123023987},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.28439998626708984},{"id":"https://openalex.org/C98214594","wikidata":"https://www.wikidata.org/wiki/Q850275","display_name":"Conformal map","level":2,"score":0.2815999984741211},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27480000257492065},{"id":"https://openalex.org/C134121241","wikidata":"https://www.wikidata.org/wiki/Q899301","display_name":"Yield (engineering)","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25780001282691956},{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.18812","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18812","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.18812","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18812","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"NLP":[1],"and":[2,23,103,132,150,182,207],"LLM":[3,205],"systems":[4,206],"are":[5,93],"pipelines:":[6],"named":[7],"entity":[8,12,16],"recognition":[9],"(NER)":[10],"-&gt;":[11,15,21,28,30,116,118],"disambiguation":[13],"(NED)":[14],"typing,":[17],"retrieval-augmented":[18],"generation":[19],"(retriever":[20],"reader),":[22],"agentic":[24],"chains":[25],"of":[26],"planner":[27],"tool":[29],"critic.":[31],"Errors":[32],"compound":[33,204],"across":[34],"stages,":[35],"but":[36,57],"existing":[37],"uncertainty":[38],"quantification":[39],"methods":[40],"either":[41],"calibrate":[42],"each":[43],"stage":[44],"independently":[45],"(no":[46],"joint":[47,68,79],"coverage)":[48],"or":[49],"apply":[50],"a":[51,71,85,109,113,173],"Bonferroni":[52,131],"union":[53],"bound":[54],"(joint":[55],"coverage,":[56],"conservative).":[58],"We":[59],"present":[60],"PASC":[61,83,123,154,171],"(Pipeline-Aware":[62],"Split":[63],"Conformal),":[64],"which":[65],"reduces":[66],"multi-stage":[67],"coverage":[69,127,159],"to":[70,108,147,169,184,193,203],"single":[72,174],"scalar":[73],"conformal":[74],"prediction":[75,140],"problem":[76],"on":[77],"the":[78,157,161],"maximum":[80],"nonconformity":[81],"score.":[82],"provides":[84],"finite-sample":[86],"distribution-free":[87],"guarantee":[88],"that":[89],"all":[90],"K":[91,185],"stages":[92,188],"simultaneously":[94],"covered":[95],"with":[96],"probability":[97],"at":[98,137],"least":[99],"1":[100],"-":[101],"alpha,":[102],"is":[104],"nearly":[105],"tight":[106],"up":[107],"1/(n+1)":[110],"factor.":[111],"On":[112],"three-stage":[114],"NER":[115],"NED":[117],"entity-typing":[119],"pipeline":[120],"over":[121],"CoNLL-2003,":[122],"achieves":[124],"96.4%":[125],"end-to-end":[126,195],"versus":[128],"93.4%":[129],"for":[130,134],"86.5%":[133],"independent":[135,166,190],"CP,":[136],"identical":[138],"average":[139],"set":[141],"size":[142],"(1.083).":[143],"Under":[144],"distribution":[145],"shift":[146,163],"WNUT-17":[148],"Twitter":[149],"WikiNEuRal":[151],"Wikipedia":[152],"data,":[153],"empirically":[155],"maintains":[156],"target":[158],"in":[160],"tested":[162],"settings":[164],"while":[165],"CP":[167,191],"collapses":[168],"59%.":[170],"requires":[172],"quantile":[175],"computation,":[176],"runs":[177],"1.7x":[178],"faster":[179],"than":[180],"Bonferroni,":[181],"scales":[183],"=":[186],"6":[187],"where":[189],"drops":[192],"0.53":[194],"coverage.":[196],"The":[197],"same":[198],"joint-maximum-score":[199],"reduction":[200],"applies":[201],"directly":[202],"agent":[208],"pipelines.":[209]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-21T00:00:00"}
