{"id":"https://openalex.org/W7161829213","doi":"https://doi.org/10.48550/arxiv.2605.18871","title":"Distributional Energy-Based Models for Uncertainty-Aware Structured LLM Reasoning","display_name":"Distributional Energy-Based Models for Uncertainty-Aware Structured LLM Reasoning","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7161829213","doi":"https://doi.org/10.48550/arxiv.2605.18871"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.18871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.18871","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000669621","display_name":"Shireen Kudukkil Manchingal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manchingal, Shireen Kudukkil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136586968","display_name":"Abhey Kalia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kalia, Abhey","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136525250","display_name":"Fernanda Gon\u00e7alves","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gon\u00e7alves, Fernanda","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136579503","display_name":"Shebin Rawther","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rawther, Shebin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4869000017642975,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4869000017642975,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.14659999310970306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.033399999141693115,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5932000279426575},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5608999729156494},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5511999726295471},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5321000218391418},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4828000068664551},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.48249998688697815},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4544000029563904},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4343000054359436}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7570000290870667},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5932000279426575},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5608999729156494},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5511999726295471},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5321000218391418},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4828000068664551},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.48249998688697815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45590001344680786},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4544000029563904},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4343000054359436},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39730000495910645},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33250001072883606},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33180001378059387},{"id":"https://openalex.org/C2779346075","wikidata":"https://www.wikidata.org/wiki/Q7268763","display_name":"Quality Score","level":3,"score":0.32260000705718994},{"id":"https://openalex.org/C63002673","wikidata":"https://www.wikidata.org/wiki/Q2260590","display_name":"Scoring rule","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.30320000648498535},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.3000999987125397},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.28679999709129333},{"id":"https://openalex.org/C162376815","wikidata":"https://www.wikidata.org/wiki/Q2158281","display_name":"Frequentist inference","level":4,"score":0.28299999237060547},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.26739999651908875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.18871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.18871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.63431316614151,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"When":[0],"Large":[1],"Language":[2],"Models":[3],"produce":[4],"structured":[5,56],"outputs":[6],"such":[7],"as":[8,25],"travel":[9],"plans,":[10],"code":[11,181],"solutions,":[12],"or":[13,33,98],"multi-step":[14],"proofs,":[15],"individual":[16],"reasoning":[17,193],"steps":[18],"may":[19],"appear":[20],"correct":[21],"while":[22,82,171],"the":[23,77,83],"output":[24],"a":[26,39,45,63,70,90,114,197,213,222],"whole":[27],"violates":[28],"budgets,":[29],"fails":[30],"test":[31],"cases,":[32],"contradicts":[34],"earlier":[35],"deductions.":[36],"We":[37],"propose":[38],"decomposed":[40],"energy":[41],"function":[42],"that":[43,94],"combines":[44],"learned":[46],"quality":[47,60,189],"scorer":[48,61,215],"with":[49],"deterministic":[50],"analytical":[51],"constraint":[52,137],"penalties":[53],"for":[54],"verifying":[55],"LLM":[57],"outputs.":[58],"The":[59,151],"is":[62],"heterogeneous":[64],"ensemble":[65,78],"of":[66,116],"low-rank":[67],"adapters":[68],"on":[69,123,130,145,191,200,208,218],"single":[71],"frozen":[72],"encoder":[73],"(3%":[74],"trainable":[75],"parameters);":[76],"mean":[79],"ranks":[80],"candidates":[81],"standard":[84],"deviation":[85],"quantifies":[86],"epistemic":[87],"uncertainty,":[88],"driving":[89],"two-pass":[91],"inference":[92],"loop":[93],"triggers":[95],"targeted":[96],"regeneration":[97],"abstention.":[99],"Across":[100],"five":[101],"benchmarks":[102],"(GSM8K,":[103],"MuSR,":[104],"TravelPlanner,":[105],"TACO,":[106],"Knights":[107],"&amp;":[108],"Knaves),":[109],"our":[110],"149M-parameter":[111],"verifier":[112,164],"orchestrating":[113],"pool":[115],"7-26B":[117],"open":[118],"generators":[119],"outperforms":[120],"single-shot":[121],"Qwen-72B":[122],"every":[124],"benchmark,":[125],"matches":[126],"Claude":[127],"Sonnet":[128],"4.6":[129,144],"MuSR":[131],"(67.7%":[132],"vs.":[133],"68.0%),":[134],"and":[135,195],"reduces":[136],"violations":[138],"by":[139],"53%":[140],"relative":[141],"to":[142],"Opus":[143],"TravelPlanner":[146],"(oracle":[147],"0.028,":[148],"random":[149],"0.231).":[150],"two":[152],"routes":[153],"are":[154,161,177],"complementary:":[155],"structural":[156],"verification":[157],"wins":[158],"when":[159],"constraints":[160],"checkable":[162],"(the":[163],"captures":[165],"signal":[166],"frontier":[167],"models":[168],"cannot":[169],"self-detect),":[170],"pretraining-scale":[172],"priors":[173],"win":[174],"where":[175],"they":[176],"not":[178],"(narrative":[179],"inference,":[180],"semantics).":[182],"A":[183],"cross-dataset":[184],"confounding":[185],"analysis":[186],"confirms":[187],"genuine":[188],"discrimination":[190],"four":[192],"tasks":[194],"identifies":[196],"model-identity":[198],"shortcut":[199],"code,":[201],"mitigated":[202],"via":[203],"last-layer":[204],"retraining.":[205],"Scorers":[206],"trained":[207],"difficult":[209],"data":[210],"transfer":[211],"zero-shot:":[212],"MuSR-trained":[214],"achieves":[216],"93.9%":[217],"GSM8K":[219],"without":[220],"seeing":[221],"math":[223],"problem.":[224]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-21T00:00:00"}
