{"id":"https://openalex.org/W7163007755","doi":"https://doi.org/10.48550/arxiv.2605.30693","title":"Triaging Threats to Specialized Guardrails","display_name":"Triaging Threats to Specialized Guardrails","publication_year":2026,"publication_date":"2026-05-29","ids":{"openalex":"https://openalex.org/W7163007755","doi":"https://doi.org/10.48550/arxiv.2605.30693"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.30693","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30693","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.30693","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137550184","display_name":"Wenjie Jacky Mo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mo, Wenjie Jacky","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137515901","display_name":"Xiaofei Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Xiaofei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137577187","display_name":"Rui Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137536246","display_name":"Boyu Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Boyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137554924","display_name":"Sicong Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Sicong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137611840","display_name":"Zihan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zihan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137563993","display_name":"Minglai Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Minglai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137578344","display_name":"Zhe Zhao","orcid":"https://orcid.org/0000-0002-0781-0204"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Zhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137570552","display_name":"Muhao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Muhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.8353999853134155,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.8353999853134155,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.025599999353289604,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.021900000050663948,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5647000074386597},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5015000104904175},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.35589998960494995},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.310699999332428},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.302700012922287}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6297000050544739},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5647000074386597},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5015000104904175},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.4068000018596649},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.37709999084472656},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.35589998960494995},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.302700012922287},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2824999988079071},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2797999978065491}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.30693","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30693","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.30693","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.30693","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5718599557876587,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Building":[0],"robust":[1],"safety":[2,21],"guardrails":[3,46,83,118],"is":[4],"essential":[5],"for":[6,119],"deploying":[7],"Large":[8],"Language":[9],"Models":[10],"across":[11],"diverse":[12],"real-world":[13],"applications.":[14],"However,":[15],"this":[16],"goal":[17],"remains":[18,42],"challenging":[19],"because":[20],"risks":[22],"span":[23],"heterogeneous":[24],"threat":[25,89,128],"domains,":[26],"while":[27],"existing":[28],"datasets":[29],"cover":[30],"only":[31],"fragmented":[32],"risk":[33],"subsets":[34],"and":[35,139],"rely":[36],"on":[37,78],"inconsistent":[38],"taxonomies.":[39],"Consequently,":[40],"it":[41],"unclear":[43],"whether":[44],"current":[45],"can":[47],"generalize":[48],"beyond":[49],"narrow":[50],"evaluation":[51],"settings.":[52],"To":[53],"better":[54,135],"understand":[55],"the":[56],"robustness":[57],"of":[58],"guardrail":[59,132],"models,":[60],"we":[61],"first":[62],"introduce":[63],"GuardZoo,":[64],"a":[65,101,108],"unified":[66],"human-annotated":[67],"benchmark":[68],"with":[69],"32,460":[70],"samples":[71],"covering":[72],"15":[73],"distinct":[74,92],"unsafe":[75],"categories.":[76],"Evaluation":[77],"GuardZoo":[79],"reveals":[80],"that":[81,95,111,124],"monolithic":[82],"suffer":[84],"from":[85],"task":[86],"interference:":[87],"different":[88],"domains":[90],"require":[91],"decision":[93],"boundaries":[94],"are":[96],"difficult":[97],"to":[98,115,144],"compress":[99],"into":[100],"single":[102],"model.":[103],"We":[104],"therefore":[105],"propose":[106],"RouteGuard,":[107],"router-expert":[109],"framework":[110],"triages":[112],"each":[113],"conversation":[114],"specialized":[116],"expert":[117],"threat-specific":[120],"detection.":[121],"Experiments":[122],"show":[123],"RouteGuard":[125],"improves":[126],"fine-grained":[127],"detection":[129],"over":[130],"strong":[131],"baselines,":[133],"generalizes":[134],"under":[136],"out-of-domain":[137],"evaluation,":[138],"supports":[140],"flexible":[141],"modular":[142],"expansion":[143],"emerging":[145],"threats.":[146]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-06-02T00:00:00"}
