{"id":"https://openalex.org/W7156314891","doi":"https://doi.org/10.48550/arxiv.2604.21964","title":"Lessons from External Review of DeepMind's Scheming Inability Safety Case","display_name":"Lessons from External Review of DeepMind's Scheming Inability Safety Case","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7156314891","doi":"https://doi.org/10.48550/arxiv.2604.21964"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.21964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.21964","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134718406","display_name":"Stephen Barrett","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barrett, Stephen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134703880","display_name":"Francisco Javier Campos Zabala","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zabala, Francisco Javier Campos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121048982","display_name":"Sean P. Fillingham","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fillingham, Sean P.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036366006","display_name":"Umair Siddique","orcid":"https://orcid.org/0000-0001-6871-5289"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Siddique, Umair","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123658563","display_name":"James Walpole","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Walpole, James","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134728294","display_name":"Robin Bloomfield","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bloomfield, Robin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5116225220","display_name":"Henry Papadatos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Papadatos, Henry","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13295","display_name":"Safety Systems Engineering in Autonomy","score":0.8736000061035156,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13295","display_name":"Safety Systems Engineering in Autonomy","score":0.8736000061035156,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.039000000804662704,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.03269999846816063,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.6467000246047974},{"id":"https://openalex.org/keywords/harm","display_name":"Harm","score":0.6097000241279602},{"id":"https://openalex.org/keywords/incentive","display_name":"Incentive","score":0.5182999968528748},{"id":"https://openalex.org/keywords/affect","display_name":"Affect (linguistics)","score":0.47360000014305115},{"id":"https://openalex.org/keywords/safety-assurance","display_name":"Safety assurance","score":0.4496999979019165},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.421099990606308},{"id":"https://openalex.org/keywords/system-safety","display_name":"System safety","score":0.35440000891685486}],"concepts":[{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.6488000154495239},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.6467000246047974},{"id":"https://openalex.org/C2777363581","wikidata":"https://www.wikidata.org/wiki/Q15098235","display_name":"Harm","level":2,"score":0.6097000241279602},{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.5182999968528748},{"id":"https://openalex.org/C2776035688","wikidata":"https://www.wikidata.org/wiki/Q1606558","display_name":"Affect (linguistics)","level":2,"score":0.47360000014305115},{"id":"https://openalex.org/C112805685","wikidata":"https://www.wikidata.org/wiki/Q10566551","display_name":"Safety assurance","level":2,"score":0.4496999979019165},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.42179998755455017},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.421099990606308},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.39399999380111694},{"id":"https://openalex.org/C39549134","wikidata":"https://www.wikidata.org/wiki/Q133080","display_name":"Public relations","level":1,"score":0.3626999855041504},{"id":"https://openalex.org/C132835097","wikidata":"https://www.wikidata.org/wiki/Q7663745","display_name":"System safety","level":2,"score":0.35440000891685486},{"id":"https://openalex.org/C106436119","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assurance","level":3,"score":0.32589998841285706},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3172999918460846},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.30489999055862427},{"id":"https://openalex.org/C2994198235","wikidata":"https://www.wikidata.org/wiki/Q14493193","display_name":"Workplace safety","level":3,"score":0.30250000953674316},{"id":"https://openalex.org/C2780234205","wikidata":"https://www.wikidata.org/wiki/Q2281276","display_name":"Safety case","level":2,"score":0.30149999260902405},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C195094911","wikidata":"https://www.wikidata.org/wiki/Q14167904","display_name":"Process management","level":1,"score":0.2743000090122223},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.2646999955177307},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.2526000142097473},{"id":"https://openalex.org/C162118730","wikidata":"https://www.wikidata.org/wiki/Q1128453","display_name":"Actuarial science","level":1,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.21964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.21964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7892756462097168,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Safety":[0],"cases":[1],"for":[2,88,98],"frontier":[3],"AI":[4,108],"systems":[5],"should":[6,102,110],"provide":[7,95,111],"a":[8],"convincing":[9],"argument,":[10],"supported":[11],"by":[12],"evidence,":[13],"that":[14,76],"the":[15,38,54,79,82],"risk":[16],"of":[17,40,63,81],"harm":[18],"is":[19],"within":[20],"an":[21,60],"acceptable":[22],"bound.":[23],"When":[24],"developers":[25,109],"author":[26],"their":[27],"own":[28],"safety":[29,69,83],"cases,":[30],"confirmation":[31],"bias":[32],"and":[33,85,105],"conflicted":[34],"incentives":[35],"can":[36,44],"affect":[37,78],"quality":[39],"argument.":[41],"External":[42],"review":[43,62,101],"help":[45],"to":[46,58,112],"address":[47],"this.":[48],"In":[49],"this":[50,92],"paper,":[51],"we":[52,94],"apply":[53],"Assurance":[55],"2.0":[56],"framework":[57],"perform":[59],"external":[61,100],"Google":[64],"DeepMind's":[65],"public":[66],"scheming":[67],"inability":[68],"case.":[70],"We":[71],"surface":[72],"substantive":[73],"new":[74],"concerns":[75],"materially":[77],"scope":[80],"case":[84],"its":[86],"applicability":[87],"decision-making.":[89],"Based":[90],"on":[91],"experience,":[93],"concrete":[96],"recommendations":[97],"how":[99],"be":[103],"conducted":[104],"what":[106],"information":[107],"support":[113],"it.":[114]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-28T00:00:00"}
