{"id":"https://openalex.org/W4414902901","doi":"https://doi.org/10.48550/arxiv.2503.15182","title":"Foundation models may exhibit staged progression in novel CBRN threat disclosure","display_name":"Foundation models may exhibit staged progression in novel CBRN threat disclosure","publication_year":2025,"publication_date":"2025-03-19","ids":{"openalex":"https://openalex.org/W4414902901","doi":"https://doi.org/10.48550/arxiv.2503.15182"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2503.15182","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15182","pdf_url":"https://arxiv.org/pdf/2503.15182","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.15182","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078038225","display_name":"Kevin M. Esvelt","orcid":"https://orcid.org/0000-0001-8797-3945"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Esvelt, Kevin M","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5078038225"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10417","display_name":"Lung Cancer Treatments and Mutations","score":0.21619999408721924,"subfield":{"id":"https://openalex.org/subfields/2740","display_name":"Pulmonary and Respiratory Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10417","display_name":"Lung Cancer Treatments and Mutations","score":0.21619999408721924,"subfield":{"id":"https://openalex.org/subfields/2740","display_name":"Pulmonary and Respiratory Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sonnet","display_name":"Sonnet","score":0.6708999872207642},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.6560999751091003},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.43810001015663147},{"id":"https://openalex.org/keywords/web-site","display_name":"Web site","score":0.289000004529953}],"concepts":[{"id":"https://openalex.org/C38721330","wikidata":"https://www.wikidata.org/wiki/Q80056","display_name":"Sonnet","level":3,"score":0.6708999872207642},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.6560999751091003},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.43810001015663147},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.43650001287460327},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.43149998784065247},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.397599995136261},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.38040000200271606},{"id":"https://openalex.org/C2984519610","wikidata":"https://www.wikidata.org/wiki/Q35127","display_name":"Web site","level":3,"score":0.289000004529953},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.2549999952316284},{"id":"https://openalex.org/C2778177712","wikidata":"https://www.wikidata.org/wiki/Q37707","display_name":"Haiku","level":3,"score":0.2493000030517578}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2503.15182","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15182","pdf_url":"https://arxiv.org/pdf/2503.15182","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2503.15182","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.15182","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.15182","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15182","pdf_url":"https://arxiv.org/pdf/2503.15182","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"extent":[1],"to":[2,16,22,53,97,141,169,174,196,206],"which":[3],"foundation":[4],"models":[5,168],"can":[6],"disclose":[7,170],"novel":[8,40,171],"chemical,":[9],"biological,":[10],"radiation,":[11],"and":[12,50,102],"nuclear":[13],"(CBRN)":[14],"threats":[15,173,201],"expert":[17,149],"users":[18,181],"is":[19,139],"unclear":[20],"due":[21],"a":[23,39,55,98,113,117],"lack":[24],"of":[25,70,135],"test":[26],"cases.":[27],"I":[28],"leveraged":[29],"the":[30,68],"unique":[31],"opportunity":[32],"presented":[33],"by":[34,112],"an":[35],"upcoming":[36],"publication":[37],"describing":[38],"catastrophic":[41],"biothreat":[42],"-":[43,52],"\"Technical":[44],"Report":[45],"on":[46],"Mirror":[47],"Bacteria:":[48],"Feasibility":[49],"Risks\"":[51],"conduct":[54],"small":[56],"controlled":[57],"study":[58],"before":[59,209],"it":[60],"became":[61],"public.":[62],"Graduate-trained":[63],"biologists":[64],"tasked":[65],"with":[66,124,147,158],"predicting":[67],"consequences":[69],"releasing":[71],"mirror":[72,144,185],"E.":[73],"coli":[74],"showed":[75],"no":[76],"significant":[77],"differences":[78],"in":[79],"rubric-graded":[80],"accuracy":[81],"using":[82],"Claude":[83],"Sonnet":[84,107,154],"3.5":[85],"new":[86,193],"(n=10)":[87],"or":[88,179],"web":[89,99],"search":[90],"only":[91,157,188],"(n=2);":[92],"both":[93],"groups":[94],"scored":[95],"comparably":[96],"baseline":[100],"(28":[101],"43":[103],"versus":[104,128],"36).":[105],"However,":[106],"reasoned":[108],"correctly":[109,155],"when":[110],"prompted":[111],"report":[114],"author,":[115],"but":[116],"smaller":[118],"model,":[119],"Haiku":[120,138],"3.5,":[121],"failed":[122],"even":[123,146],"author":[125],"guidance":[126,150],"(80":[127],"5).":[129],"These":[130],"results":[131],"suggest":[132],"distinct":[133],"stages":[134],"model":[136],"capability:":[137],"unable":[140],"reason":[142,197],"about":[143,198],"life":[145,186],"threat-aware":[148,159],"(Stage":[151,161,177,182],"1),":[152],"while":[153],"reasons":[156],"prompting":[160],"2).":[162],"Continued":[163],"advances":[164],"may":[165,202],"allow":[166,203],"future":[167],"CBRN":[172],"naive":[175],"experts":[176],"3)":[178],"unskilled":[180],"4).":[183],"While":[184],"represents":[187],"one":[189],"case":[190],"study,":[191],"monitoring":[192],"models'":[194],"ability":[195],"privately":[199],"known":[200],"protective":[204],"measures":[205],"be":[207],"implemented":[208],"widespread":[210],"disclosure.":[211]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
