{"id":"https://openalex.org/W7151298040","doi":"https://doi.org/10.48550/arxiv.2604.03962","title":"Predict, Don't React: Value-Based Safety Forecasting for LLM Streaming","display_name":"Predict, Don't React: Value-Based Safety Forecasting for LLM Streaming","publication_year":2026,"publication_date":"2026-04-05","ids":{"openalex":"https://openalex.org/W7151298040","doi":"https://doi.org/10.48550/arxiv.2604.03962"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03962","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031104941","display_name":"Pride Kavumba","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kavumba, Pride","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133083491","display_name":"Koki Wataoka","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wataoka, Koki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101654553","display_name":"Huy H. Nguyen","orcid":"https://orcid.org/0000-0002-2000-7977"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nguyen, Huy H.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133134338","display_name":"Jiaxuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jiaxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133105413","display_name":"Masaya Ohagi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ohagi, Masaya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5031104941"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3025999963283539,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3025999963283539,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.12280000001192093,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.11249999701976776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/moderation","display_name":"Moderation","score":0.6279000043869019},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.5837000012397766},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5676000118255615},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.40290001034736633},{"id":"https://openalex.org/keywords/prefix","display_name":"Prefix","score":0.3970000147819519},{"id":"https://openalex.org/keywords/session","display_name":"Session (web analytics)","score":0.33500000834465027}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6894999742507935},{"id":"https://openalex.org/C93225998","wikidata":"https://www.wikidata.org/wiki/Q1941972","display_name":"Moderation","level":2,"score":0.6279000043869019},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.5837000012397766},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5676000118255615},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C141603448","wikidata":"https://www.wikidata.org/wiki/Q134830","display_name":"Prefix","level":2,"score":0.3970000147819519},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.34540000557899475},{"id":"https://openalex.org/C2779182362","wikidata":"https://www.wikidata.org/wiki/Q17126187","display_name":"Session (web analytics)","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C2986160907","wikidata":"https://www.wikidata.org/wiki/Q220499","display_name":"Video streaming","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C30311675","wikidata":"https://www.wikidata.org/wiki/Q7622689","display_name":"Streaming current","level":3,"score":0.296099990606308},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2935999929904938},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.2655999958515167},{"id":"https://openalex.org/C72868586","wikidata":"https://www.wikidata.org/wiki/Q5599587","display_name":"Great Moderation","level":3,"score":0.2590999901294708},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03962","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4024336040019989,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0,63],"many":[1],"practical":[2],"LLM":[3],"deployments,":[4],"a":[5,57,69,79,83,215],"single":[6],"guardrail":[7,73],"is":[8,239],"used":[9],"for":[10,122,126,179,244],"both":[11,121],"prompt":[12],"and":[13,125,143,167,177,200,214,234],"response":[14,25,58],"moderation.":[15,129],"Prompt":[16],"moderation":[17,26,77,124,226],"operates":[18],"on":[19],"fully":[20],"observed":[21],"text,":[22],"whereas":[23],"streaming":[24,38,72,127,145,159,212,225],"requires":[27],"safety":[28,116,246],"decisions":[29],"to":[30,50,141,150,153,172,188],"be":[31,228],"made":[32],"over":[33],"partial":[34,84],"generations.":[35],"Existing":[36],"text-based":[37],"guardrails":[39],"commonly":[40],"frame":[41],"this":[42,64,98],"output-side":[43],"problem":[44],"as":[45,78],"boundary":[46,112,232],"detection,":[47],"training":[48],"models":[49],"identify":[51],"the":[52,86,89,131,156,183],"earliest":[53],"prefix":[54],"at":[55],"which":[56,104],"has":[59],"already":[60],"become":[61],"unsafe.":[62],"work,":[65],"we":[66],"introduce":[67],"StreamGuard,":[68],"unified":[70],"model-agnostic":[71],"that":[74,193,222,235],"instead":[75],"formulates":[76],"forecasting":[80,236],"problem:":[81],"given":[82],"prefix,":[85],"model":[87,201],"predicts":[88],"expected":[90],"harmfulness":[91],"of":[92],"likely":[93],"future":[94,237],"continuations.":[95],"We":[96,190],"supervise":[97],"prediction":[99],"using":[100],"Monte":[101],"Carlo":[102],"rollouts,":[103],"enables":[105],"early":[106],"intervention":[107],"without":[108,230],"requiring":[109],"exact":[110,231],"token-level":[111],"annotations.":[113],"Across":[114],"standard":[115],"benchmarks,":[117],"StreamGuard":[118,134,161],"performs":[119],"strongly":[120],"input":[123],"output":[128],"At":[130],"8B":[132],"scale,":[133],"improves":[135],"aggregated":[136,144],"input-moderation":[137],"F1":[138,147],"from":[139,148,186],"86.7":[140],"88.2":[142],"output-moderation":[146],"80.4":[149],"81.9":[151],"relative":[152],"Qwen3Guard-Stream-8B-strict.":[154],"On":[155],"QWENGUARDTEST":[157],"response_loc":[158],"benchmark,":[160],"reaches":[162,207],"97.5":[163],"F1,":[164,174,210,213],"95.1":[165],"recall,":[166,176],"92.6%":[168],"on-time":[169],"intervention,":[170],"compared":[171],"95.9":[173],"92.1":[175],"89.9%":[178],"Qwen3Guard-Stream-8B-stric,":[180],"while":[181],"reducing":[182],"miss":[184,217],"rate":[185],"7.9%":[187],"4.9%.":[189],"further":[191],"show":[192,221],"forecasting-based":[194],"supervision":[195,242],"transfers":[196],"effectively":[197],"across":[198],"tokenizers":[199],"families:":[202],"with":[203],"transferred":[204],"targets,":[205],"Gemma3-StreamGuard-1B":[206],"81.3":[208],"response-moderation":[209],"98.2":[211],"3.5%":[216],"rate.":[218],"These":[219],"results":[220],"strong":[223],"end-to-end":[224],"can":[227],"obtained":[229],"labels,":[233],"risk":[238],"an":[240],"effective":[241],"strategy":[243],"low-latency":[245],"intervention.":[247]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-08T00:00:00"}
