{"id":"https://openalex.org/W7155157077","doi":"https://doi.org/10.48550/arxiv.2604.18976","title":"STAR-Teaming: A Strategy-Response Multiplex Network Approach to Automated LLM Red Teaming","display_name":"STAR-Teaming: A Strategy-Response Multiplex Network Approach to Automated LLM Red Teaming","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155157077","doi":"https://doi.org/10.48550/arxiv.2604.18976"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18976","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134231472","display_name":"MinJae Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jung, MinJae","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102079663","display_name":"Yongtaek Lim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lim, YongTaek","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126824319","display_name":"Chaeyun Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Chaeyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134218174","display_name":"Junghwan Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Junghwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134271843","display_name":"Kihyun Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Kihyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134226112","display_name":"Minwoo Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Minwoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5134231472"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3822000026702881,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3822000026702881,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.13910000026226044,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.0731000006198883,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.9158999919891357},{"id":"https://openalex.org/keywords/multiplex","display_name":"Multiplex","score":0.5699999928474426},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5641000270843506},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4562000036239624},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.36899998784065247},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.3637999892234802}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.9158999919891357},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7304999828338623},{"id":"https://openalex.org/C2781188995","wikidata":"https://www.wikidata.org/wiki/Q6934982","display_name":"Multiplex","level":2,"score":0.5699999928474426},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5641000270843506},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49129998683929443},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4562000036239624},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40220001339912415},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36910000443458557},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.36899998784065247},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3637999892234802},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.33869999647140503},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2628999948501587}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5738596320152283,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"are":[5],"widely":[6],"used,":[7],"they":[8],"remain":[9],"susceptible":[10],"to":[11,53],"jailbreak":[12],"prompts":[13],"that":[14,33,107],"can":[15],"elicit":[16],"harmful":[17],"or":[18],"inappropriate":[19],"responses.":[20],"This":[21,58],"paper":[22],"introduces":[23],"STAR-Teaming,":[24],"a":[25,40,45,68,114,121],"novel":[26],"black-box":[27],"framework":[28],"for":[29,89],"automated":[30],"red":[31],"teaming":[32],"effectively":[34],"generates":[35],"such":[36],"prompts.":[37],"STAR-Teaming":[38,108],"integrates":[39],"Multi-Agent":[41],"System":[42],"(MAS)":[43],"with":[44],"Strategy-Response":[46],"Multiplex":[47,134],"Network":[48],"and":[49,84,130],"employs":[50],"network-driven":[51],"optimization":[52],"sample":[54],"effective":[55,90],"attack":[56,116],"strategies.":[57],"network-based":[59],"approach":[60],"recasts":[61],"the":[62,77,80,87,94,128,133],"intractable":[63],"high-dimensional":[64],"embedding":[65],"space":[66,96],"into":[67,97],"tractable":[69],"structure,":[70],"yielding":[71],"two":[72],"key":[73],"advantages:":[74],"it":[75,85],"enhances":[76],"interpretability":[78],"of":[79,132],"LLM's":[81],"strategic":[82],"vulnerabilities,":[83],"streamlines":[86],"search":[88,95],"strategies":[91],"by":[92],"organizing":[93],"semantic":[98],"communities,":[99],"thereby":[100],"preventing":[101],"redundant":[102],"exploration.":[103],"Empirical":[104],"results":[105],"demonstrate":[106],"significantly":[109],"surpasses":[110],"existing":[111],"methods,":[112],"achieving":[113],"higher":[115],"success":[117],"rate":[118],"(ASR)":[119],"at":[120,140],"lower":[122],"computational":[123],"cost.":[124],"Extensive":[125],"experiments":[126],"validate":[127],"effectiveness":[129],"explainability":[131],"Network.":[135],"The":[136],"code":[137],"is":[138],"available":[139],"https://github.com/selectstar-ai/STAR-Teaming-paper.":[141]},"counts_by_year":[],"updated_date":"2026-04-23T06:20:18.424754","created_date":"2026-04-23T00:00:00"}
