{"id":"https://openalex.org/W7151581071","doi":"https://doi.org/10.48550/arxiv.2604.03473","title":"Evolutionary Search for Automated Design of Uncertainty Quantification Methods","display_name":"Evolutionary Search for Automated Design of Uncertainty Quantification Methods","publication_year":2026,"publication_date":"2026-04-03","ids":{"openalex":"https://openalex.org/W7151581071","doi":"https://doi.org/10.48550/arxiv.2604.03473"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03473","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133066849","display_name":"Mikhail Seleznyov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seleznyov, Mikhail","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133090688","display_name":"Daniil Korbut","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Korbut, Daniil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133089074","display_name":"Viktor Moskvoretskii","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moskvoretskii, Viktor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092596475","display_name":"Oleg Somov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Somov, Oleg","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133076306","display_name":"Alexander Panchenko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Panchenko, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133079559","display_name":"Elena Tutubalina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tutubalina, Elena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.5690000057220459,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.5690000057220459,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.273499995470047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.02410000003874302,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5943999886512756},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5494999885559082},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5101000070571899},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.4650999903678894},{"id":"https://openalex.org/keywords/evolutionary-computation","display_name":"Evolutionary computation","score":0.4359999895095825},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.4002000093460083},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.35249999165534973},{"id":"https://openalex.org/keywords/genetic-programming","display_name":"Genetic programming","score":0.33469998836517334}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6165000200271606},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5943999886512756},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5800999999046326},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5494999885559082},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.546500027179718},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5101000070571899},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.4650999903678894},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.4359999895095825},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.4002000093460083},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3801000118255615},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.35249999165534973},{"id":"https://openalex.org/C110332635","wikidata":"https://www.wikidata.org/wiki/Q629498","display_name":"Genetic programming","level":2,"score":0.33469998836517334},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3221000134944916},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.31290000677108765},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.2777999937534332},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.2669999897480011},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C35129592","wikidata":"https://www.wikidata.org/wiki/Q324793","display_name":"Memetic algorithm","level":3,"score":0.2612000107765198},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03473","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03473","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Uncertainty":[0],"quantification":[1],"(UQ)":[2],"methods":[3,34,48],"for":[4,134],"large":[5],"language":[6],"models":[7,79],"are":[8],"predominantly":[9],"designed":[10],"by":[11],"hand":[12],"based":[13],"on":[14],"domain":[15],"knowledge":[16],"and":[17,22,90,100],"heuristics,":[18],"limiting":[19],"their":[20],"scalability":[21],"generality.":[23],"We":[24],"apply":[25],"LLM-powered":[26,127],"evolutionary":[27,76,128],"search":[28,129],"to":[29,55,108,119],"automatically":[30],"discover":[31],"unsupervised":[32],"UQ":[33],"represented":[35],"as":[36],"Python":[37],"programs.":[38],"On":[39],"the":[40],"task":[41],"of":[42],"atomic":[43],"claim":[44],"verification,":[45],"our":[46,123],"evolved":[47],"outperform":[49],"strong":[50],"manually-designed":[51],"baselines,":[52],"achieving":[53],"up":[54],"6.7%":[56],"relative":[57,118],"ROC-AUC":[58],"improvement":[59],"across":[60],"9":[61],"datasets":[62],"while":[63,85],"generalizing":[64],"robustly":[65],"out-of-distribution.":[66],"Qualitative":[67],"analysis":[68],"reveals":[69],"that":[70,126],"different":[71],"LLMs":[72],"employ":[73],"qualitatively":[74],"distinct":[75],"strategies:":[77],"Claude":[78],"consistently":[80],"design":[81],"high-feature-count":[82],"linear":[83],"estimators,":[84],"Gpt-oss-120B":[86],"gravitates":[87],"toward":[88],"simpler":[89],"more":[91],"interpretable":[92,136],"positional":[93],"weighting":[94],"schemes.":[95],"Surprisingly,":[96],"only":[97],"Sonnet":[98],"4.5":[99,102],"Opus":[101,112],"reliably":[103],"leverage":[104],"increased":[105],"method":[106],"complexity":[107],"improve":[109],"performance":[110],"--":[111],"4.6":[113],"shows":[114],"an":[115],"unexpected":[116],"regression":[117],"its":[120],"predecessor.":[121],"Overall,":[122],"results":[124],"indicate":[125],"is":[130],"a":[131],"promising":[132],"paradigm":[133],"automated,":[135],"hallucination":[137],"detector":[138],"design.":[139]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-08T00:00:00"}
