{"id":"https://openalex.org/W7117235237","doi":"https://doi.org/10.1088/2632-2153/ae3103","title":"Simulation-based inference with deep ensembles: evaluating calibration uncertainty and detecting model misspecification","display_name":"Simulation-based inference with deep ensembles: evaluating calibration uncertainty and detecting model misspecification","publication_year":2025,"publication_date":"2025-12-24","ids":{"openalex":"https://openalex.org/W7117235237","doi":"https://doi.org/10.1088/2632-2153/ae3103"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/ae3103","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae3103","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1088/2632-2153/ae3103","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"James Alvey","orcid":"https://orcid.org/0000-0003-2020-0803"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"James Alvey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Carlo R Contaldi","orcid":"https://orcid.org/0000-0001-7285-0707"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Carlo R Contaldi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Mauro Pieroni","orcid":"https://orcid.org/0000-0003-0665-266X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mauro Pieroni","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":2.5568,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.91798143,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"7","issue":"1","first_page":"015008","last_page":"015008"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.257999986410141,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.257999986410141,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.1688999980688095,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.1429000049829483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6539000272750854},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.6521999835968018},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.579200029373169},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.5755000114440918},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5480999946594238},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.4860000014305115},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.48579999804496765},{"id":"https://openalex.org/keywords/point-estimation","display_name":"Point estimation","score":0.4706999957561493},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.45910000801086426},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.43309998512268066}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6539000272750854},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.6521999835968018},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5995000004768372},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.579200029373169},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.5755000114440918},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5516999959945679},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5480999946594238},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4934000074863434},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4887000024318695},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.4860000014305115},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.48579999804496765},{"id":"https://openalex.org/C41426520","wikidata":"https://www.wikidata.org/wiki/Q1192065","display_name":"Point estimation","level":2,"score":0.4706999957561493},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.45910000801086426},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.43309998512268066},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.4124999940395355},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.40849998593330383},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3765999972820282},{"id":"https://openalex.org/C917703","wikidata":"https://www.wikidata.org/wiki/Q7239668","display_name":"Predictive inference","level":5,"score":0.375},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.3522000014781952},{"id":"https://openalex.org/C95167961","wikidata":"https://www.wikidata.org/wiki/Q4483495","display_name":"Fiducial inference","level":5,"score":0.3425000011920929},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.33649998903274536},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32710000872612},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.31940001249313354},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3190999925136566},{"id":"https://openalex.org/C134261354","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical inference","level":2,"score":0.3154999911785126},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C101112237","wikidata":"https://www.wikidata.org/wiki/Q4874481","display_name":"Bayesian statistics","level":4,"score":0.302700012922287},{"id":"https://openalex.org/C63002673","wikidata":"https://www.wikidata.org/wiki/Q2260590","display_name":"Scoring rule","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C162376815","wikidata":"https://www.wikidata.org/wiki/Q2158281","display_name":"Frequentist inference","level":4,"score":0.29600000381469727},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.28439998626708984},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.27320000529289246},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C167928553","wikidata":"https://www.wikidata.org/wiki/Q1376021","display_name":"Estimation theory","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2685999870300293},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C137209882","wikidata":"https://www.wikidata.org/wiki/Q1403517","display_name":"Measurement uncertainty","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.25949999690055847},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1088/2632-2153/ae3103","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae3103","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},{"id":"pmh:oai:digital.csic.es:10261/421742","is_oa":true,"landing_page_url":"http://hdl.handle.net/10261/421742","pdf_url":"https://digital.csic.es/bitstream/10261/421742/1/Alvey_2026_Mach._Learn.__Sci._Technol._7_015008.pdf","source":{"id":"https://openalex.org/S4306401639","display_name":"DIGITAL.CSIC (Spanish National Research Council (CSIC))","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I134820265","host_organization_name":"Consejo Superior de Investigaciones Cient\u00edficas","host_organization_lineage":["https://openalex.org/I134820265"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:doaj.org/article:92144a0ca2d84ebabce67145049a9fec","is_oa":true,"landing_page_url":"https://doaj.org/article/92144a0ca2d84ebabce67145049a9fec","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning: Science and Technology, Vol 7, Iss 1, p 015008 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/ae3103","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae3103","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320313831","display_name":"Comunidad de Madrid","ror":null},{"id":"https://openalex.org/F4320320283","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W28412257","https://openalex.org/W1534477342","https://openalex.org/W1678356000","https://openalex.org/W1965555277","https://openalex.org/W1988790447","https://openalex.org/W2071187610","https://openalex.org/W2100805904","https://openalex.org/W2148534890","https://openalex.org/W2155806188","https://openalex.org/W2167917621","https://openalex.org/W2787894218","https://openalex.org/W2789758093","https://openalex.org/W2959696098","https://openalex.org/W3031514878","https://openalex.org/W4212883601","https://openalex.org/W4287102281","https://openalex.org/W4387799659","https://openalex.org/W4388574730","https://openalex.org/W4390548146","https://openalex.org/W4394647992","https://openalex.org/W4399970888","https://openalex.org/W4406208238","https://openalex.org/W4409216285","https://openalex.org/W4409261143"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Simulation-based":[1],"inference":[2,13],"(SBI)":[3],"offers":[4],"a":[5,33,42,85,106,155,171],"principled":[6],"and":[7,26,76,121,144,174],"flexible":[8],"framework":[9,169],"for":[10,100,104,123,177],"conducting":[11],"Bayesian":[12],"in":[14,47,113,161,183],"any":[15],"situation":[16],"where":[17],"forward":[18],"simulations":[19],"are":[20],"feasible.":[21],"However,":[22],"validating":[23],"the":[24,29,53,65,92,110,118,138,162,179],"accuracy":[25],"reliability":[27],"of":[28,56,109,181],"inferred":[30],"posteriors":[31],"remains":[32],"persistent":[34],"challenge.":[35],"In":[36],"this":[37,101,166],"work,":[38],"we":[39,83],"point":[40],"out":[41],"simple":[43],"diagnostic":[44,168],"approach":[45],"rooted":[46],"ensemble":[48],"learning":[49],"methods":[50],"to":[51,64],"assess":[52],"internal":[54],"consistency":[55,86],"SBI":[57,182],"outputs":[58],"that":[59,88],"does":[60],"not":[61],"require":[62],"access":[63],"true":[66],"posterior.":[67],"By":[68],"training":[69,119,163],"multiple":[70],"neural":[71],"estimators":[72,131],"under":[73],"identical":[74],"conditions":[75],"evaluating":[77],"their":[78],"pairwise":[79],"Kullback\u2013Leibler":[80],"(KL)":[81],"divergences,":[82],"define":[84],"criterion":[87],"quantifies":[89],"agreement":[90],"across":[91],"ensemble.":[93],"We":[94,135],"highlight":[95],"two":[96],"core":[97],"use":[98],"cases":[99],"framework:":[102],"(a)":[103],"generating":[105],"robust":[107],"estimate":[108],"systematic":[111],"uncertainty":[112],"parameter":[114],"reconstruction":[115],"associated":[116],"with":[117],"procedure,":[120],"(b)":[122],"detecting":[124],"possible":[125],"model":[126],"misspecification":[127],"when":[128],"using":[129],"trained":[130],"on":[132],"real":[133],"data.":[134],"also":[136],"demonstrate":[137],"relationship":[139],"between":[140],"significant":[141],"KL":[142],"divergences":[143],"issues":[145],"such":[146],"as":[147],"insufficient":[148],"convergence":[149],"due":[150],"to,":[151],"e.g.":[152],"too":[153],"low":[154],"simulation":[156],"budget,":[157],"or":[158],"intrinsic":[159],"variance":[160],"process.":[164],"Overall,":[165],"ensemble-based":[167],"provides":[170],"lightweight,":[172],"scalable,":[173],"model-agnostic":[175],"tool":[176],"enhancing":[178],"trustworthiness":[180],"scientific":[184],"applications.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
