{"id":"https://openalex.org/W7154360903","doi":"https://doi.org/10.48550/arxiv.2604.11141","title":"Reducing Hallucination in Enterprise AI Workflows via Hybrid Utility Minimum Bayes Risk (HUMBR)","display_name":"Reducing Hallucination in Enterprise AI Workflows via Hybrid Utility Minimum Bayes Risk (HUMBR)","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154360903","doi":"https://doi.org/10.48550/arxiv.2604.11141"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.11141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.11141","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133566664","display_name":"Chenhao Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Chenhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133572293","display_name":"Jordi Mola","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mola, Jordi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133609404","display_name":"Mark Harman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Harman, Mark","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133570406","display_name":"Jason Nawrocki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nawrocki, Jason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133561765","display_name":"Vaibhav Shrivastava","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shrivastava, Vaibhav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133593304","display_name":"Yue Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133559094","display_name":"Jay Minesh Shah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shah, Jay Minesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055869345","display_name":"Katayoun Zand","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zand, Katayoun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056749939","display_name":"Mansi Tripathi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tripathi, Mansi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114453068","display_name":"Arya Pudota","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pudota, Arya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133590729","display_name":"Matthew Becker","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Becker, Matthew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133609105","display_name":"Herv\u00e9 Robert","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robert, Herv\u00e9","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077382409","display_name":"Abhishek Gulati","orcid":"https://orcid.org/0000-0002-4504-8898"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gulati, Abhishek","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.1746000051498413,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.1746000051498413,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.14229999482631683,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.12370000034570694,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.588699996471405},{"id":"https://openalex.org/keywords/bayes-theorem","display_name":"Bayes' theorem","score":0.5260999798774719},{"id":"https://openalex.org/keywords/hallucinating","display_name":"Hallucinating","score":0.3928999900817871},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.39169999957084656},{"id":"https://openalex.org/keywords/complement","display_name":"Complement (music)","score":0.3538999855518341},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.353300005197525},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.35109999775886536},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.3395000100135803},{"id":"https://openalex.org/keywords/risk-assessment","display_name":"Risk assessment","score":0.31189998984336853}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6830999851226807},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.588699996471405},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.5260999798774719},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5228999853134155},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45249998569488525},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.3928999900817871},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.39169999957084656},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.38839998841285706},{"id":"https://openalex.org/C112313634","wikidata":"https://www.wikidata.org/wiki/Q7886648","display_name":"Complement (music)","level":5,"score":0.3538999855518341},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.353300005197525},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.35109999775886536},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3147999942302704},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.31189998984336853},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.3005000054836273},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2727000117301941},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C2776390805","wikidata":"https://www.wikidata.org/wiki/Q7258035","display_name":"Public use","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.26440000534057617},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2567000091075897},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.25450000166893005}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.11141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.11141","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11141","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.4538971781730652,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Although":[0],"LLMs":[1],"drive":[2],"automation,":[3],"it":[4],"is":[5],"critical":[6,149],"to":[7,82],"ensure":[8],"immense":[9],"consideration":[10],"for":[11,88],"high-stakes":[12],"enterprise":[13],"workflows":[14,41],"such":[15,38],"as":[16,52],"those":[17],"involving":[18],"legal":[19],"matters,":[20],"risk":[21],"management,":[22],"and":[23,28,111,113,148],"privacy":[24],"compliance.":[25],"For":[26],"Meta,":[27],"other":[29],"organizations":[30],"like":[31],"ours,":[32],"a":[33,53,68,101],"single":[34],"hallucinated":[35],"clause":[36],"in":[37],"high":[39],"stakes":[40],"risks":[42],"material":[43],"consequences.":[44],"We":[45,95],"show":[46,128],"that":[47,74,129],"by":[48],"framing":[49],"hallucination":[50],"mitigation":[51],"Minimum":[54],"Bayes":[55],"Risk":[56],"(MBR)":[57],"problem,":[58],"we":[59,66,90],"can":[60],"dramatically":[61],"reduce":[62],"this":[63,97],"risk.":[64],"Specifically,":[65],"introduce":[67],"Hybrid":[69],"Utility":[70],"MBR":[71,130],"(HUMBR)":[72],"framework":[73],"synthesizes":[75],"semantic":[76],"embedding":[77],"similarity":[78],"with":[79,100],"lexical":[80],"precision":[81],"identify":[83],"consensus":[84],"without":[85],"ground-truth":[86],"references,":[87],"which":[89],"derive":[91],"rigorous":[92],"error":[93],"bounds.":[94],"complement":[96],"theoretical":[98],"analysis":[99],"comprehensive":[102],"empirical":[103,126],"evaluation":[104],"on":[105],"widely-used":[106],"public":[107],"benchmark":[108],"suites":[109],"(TruthfulQA":[110],"LegalBench)":[112],"also":[114],"real":[115],"world":[116],"data":[117],"from":[118,124],"Meta":[119],"production":[120],"deployment.":[121],"The":[122],"results":[123],"our":[125],"study":[127],"significantly":[131],"outperforms":[132],"standard":[133],"Universal":[134],"Self-Consistency.":[135],"Notably,":[136],"81%":[137],"of":[138],"the":[139],"pipeline's":[140],"suggestions":[141],"were":[142,152],"preferred":[143],"over":[144],"human-crafted":[145],"ground":[146],"truth,":[147],"recall":[150],"failures":[151],"virtually":[153],"eliminated.":[154]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-15T00:00:00"}
