{"id":"https://openalex.org/W7161754815","doi":"https://doi.org/10.48550/arxiv.2605.19220","title":"Position: Uncertainty Quantification in LLMs is Just Unsupervised Clustering","display_name":"Position: Uncertainty Quantification in LLMs is Just Unsupervised Clustering","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7161754815","doi":"https://doi.org/10.48550/arxiv.2605.19220"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.19220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.19220","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136574811","display_name":"Tiejin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Tiejin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074815612","display_name":"Longchao Da","orcid":"https://orcid.org/0009-0000-8631-9634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Da, Longchao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136598861","display_name":"Xiaoou Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaoou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136601533","display_name":"Hua Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Hua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.1509000062942505,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.1509000062942505,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1492999941110611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.11680000275373459,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/proxy","display_name":"Proxy (statistics)","score":0.6381000280380249},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5590000152587891},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.527999997138977},{"id":"https://openalex.org/keywords/overconfidence-effect","display_name":"Overconfidence effect","score":0.46869999170303345},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.45190000534057617},{"id":"https://openalex.org/keywords/uncertainty-quantification","display_name":"Uncertainty quantification","score":0.38089999556541443},{"id":"https://openalex.org/keywords/credibility","display_name":"Credibility","score":0.36640000343322754},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.3490000069141388}],"concepts":[{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.6381000280380249},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6270999908447266},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5590000152587891},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.527999997138977},{"id":"https://openalex.org/C51110983","wikidata":"https://www.wikidata.org/wiki/Q16503490","display_name":"Overconfidence effect","level":2,"score":0.46869999170303345},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.45190000534057617},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42500001192092896},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39559999108314514},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3790999948978424},{"id":"https://openalex.org/C2780224610","wikidata":"https://www.wikidata.org/wiki/Q1530061","display_name":"Credibility","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3490000069141388},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.34700000286102295},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3084999918937683},{"id":"https://openalex.org/C2780771206","wikidata":"https://www.wikidata.org/wiki/Q3271761","display_name":"Safeguard","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C37381756","wikidata":"https://www.wikidata.org/wiki/Q20203288","display_name":"Representativeness heuristic","level":2,"score":0.289900004863739},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.2874000072479248},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28450000286102295},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2637999951839447}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.19220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.19220","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19220","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6830781102180481}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Uncertainty":[0],"Quantification":[1],"(UQ)":[2],"is":[3],"widely":[4],"regarded":[5],"as":[6,195],"the":[7,23,48,52,86,99,168],"primary":[8],"safeguard":[9],"for":[10,33,157,167,181,199],"deploying":[11,98],"Large":[12],"Language":[13],"Models":[14],"(LLMs)":[15],"in":[16,80,187],"high-stakes":[17],"domains.":[18],"However,":[19],"we":[20,105,155],"argue":[21],"that":[22,42,121,129,141,191],"field":[24],"suffers":[25],"from":[26,111],"a":[27,92,117,135,158,165,196],"category":[28],"error:":[29],"mainstream":[30],"UQ":[31,88,162],"methods":[32,62,89],"LLMs":[34],"are":[35,63],"just":[36],"unsupervised":[37],"clustering":[38],"algorithms.":[39],"We":[40],"demonstrate":[41],"most":[43],"current":[44,61,87],"approaches":[45],"inherently":[46],"quantify":[47],"internal":[49,115,126],"consistency":[50],"of":[51,95,138],"model's":[53],"generations":[54],"rather":[55],"than":[56],"their":[57],"external":[58],"correctness.":[59],"Consequently,":[60],"fundamentally":[64],"blind":[65],"to":[66,71,148,161,171],"factual":[67],"reality":[68],"and":[69,134,163,176,184],"fail":[70],"detect":[72],"``confident":[73],"hallucinations,''":[74],"where":[75],"models":[76,100],"exhibit":[77],"high":[78],"confidence":[79,193],"stable":[81],"but":[82],"incorrect":[83],"answers.":[84],"Therefore,":[85],"may":[90],"create":[91],"deceptive":[93],"sense":[94],"safety":[96],"when":[97],"with":[101,132],"uncertainty.":[102,150],"In":[103],"detail,":[104],"identify":[106],"three":[107],"critical":[108],"pathologies":[109],"resulting":[110],"this":[112,153],"dependence":[113],"on":[114,144],"state:":[116],"hyperparameter":[118],"sensitivity":[119],"crisis":[120],"renders":[122],"deployment":[123],"unsafe,":[124],"an":[125],"evaluation":[127,174],"cycle":[128],"conflates":[130],"stability":[131],"truth,":[133,189],"fundamental":[136],"lack":[137],"ground":[139],"truth":[140],"forces":[142],"reliance":[143],"unstable":[145],"proxy":[146,198],"metrics":[147,175],"evaluate":[149],"To":[151],"resolve":[152],"impasse,":[154],"advocate":[156],"paradigm":[159],"shift":[160],"outline":[164],"roadmap":[166],"research":[169],"community":[170],"adopt":[172],"better":[173],"settings,":[177],"implement":[178],"mechanism":[179],"changes":[180],"native":[182],"uncertainty,":[183],"anchor":[185],"verification":[186],"objective":[188],"ensuring":[190],"model":[192],"serves":[194],"reliable":[197],"reality.":[200]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-21T00:00:00"}
