{"id":"https://openalex.org/W7160059018","doi":"https://doi.org/10.48550/arxiv.2605.00699","title":"STARE: Step-wise Temporal Alignment and Red-teaming Engine for Multi-modal Toxicity Attack","display_name":"STARE: Step-wise Temporal Alignment and Red-teaming Engine for Multi-modal Toxicity Attack","publication_year":2026,"publication_date":"2026-05-01","ids":{"openalex":"https://openalex.org/W7160059018","doi":"https://doi.org/10.48550/arxiv.2605.00699"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.00699","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00699","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.00699","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135235702","display_name":"Xutao Mao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Xutao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135271602","display_name":"Liangjie Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Liangjie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135123255","display_name":"Tao Liu","orcid":"https://orcid.org/0009-0007-3720-1665"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Tao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135133734","display_name":"Xiang Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Xiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135248685","display_name":"Hongying Zan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zan, Hongying","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135256089","display_name":"Cong Cong Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Cong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.5360999703407288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.5360999703407288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.27959999442100525,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.026200000196695328,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.553600013256073},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.5322999954223633},{"id":"https://openalex.org/keywords/vulnerability","display_name":"Vulnerability (computing)","score":0.5289999842643738},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4855000078678131},{"id":"https://openalex.org/keywords/offensive","display_name":"Offensive","score":0.47699999809265137},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.44620001316070557},{"id":"https://openalex.org/keywords/toxicity","display_name":"Toxicity","score":0.40950000286102295},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.3977000117301941}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6420000195503235},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.553600013256073},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.5322999954223633},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.5289999842643738},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4855000078678131},{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.47699999809265137},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.44620001316070557},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41670000553131104},{"id":"https://openalex.org/C29730261","wikidata":"https://www.wikidata.org/wiki/Q274160","display_name":"Toxicity","level":2,"score":0.40950000286102295},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.3977000117301941},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.3797999918460846},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2865000069141388},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2732999920845032},{"id":"https://openalex.org/C2777363581","wikidata":"https://www.wikidata.org/wiki/Q15098235","display_name":"Harm","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.2685000002384186},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2653999924659729},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.2603999972343445},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C76178495","wikidata":"https://www.wikidata.org/wiki/Q4808784","display_name":"Asset (computer security)","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.00699","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00699","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.00699","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00699","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.662182629108429,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Red-teaming":[0],"Vision-Language":[1],"Models":[2],"is":[3,150],"essential":[4],"for":[5,190],"identifying":[6],"vulnerabilities":[7],"where":[8],"adversarial":[9,120],"image-text":[10],"inputs":[11],"trigger":[12],"toxic":[13,38,201],"outputs.":[14],"Existing":[15],"approaches":[16],"treat":[17],"image":[18],"generation":[19],"as":[20,58],"a":[21,47,63,74,90,151,157,170,174,183,188],"black":[22],"box,":[23],"returning":[24],"only":[25],"terminal":[26],"toxicity":[27,143,167],"scores":[28],"and":[29,36,67,100,129,187],"leaving":[30],"open":[31],"the":[32,54,59,109,161],"question":[33],"of":[34,137,160,177,200],"when":[35],"how":[37],"semantics":[39],"emerge":[40],"during":[41],"multi-step":[42],"synthesis.":[43],"We":[44],"introduce":[45],"STARE,":[46],"hierarchical":[48,162],"reinforcement":[49],"learning":[50],"framework":[51],"that":[52,146,203],"treats":[53],"denoising":[55],"trajectory":[56],"itself":[57],"attack":[60,185],"surface,":[61],"under":[62],"direct":[64],"white-box":[65,101],"T2I":[66,80],"query-only":[68],"black-box":[69,99],"VLM":[70],"setting.":[71],"By":[72],"coupling":[73],"high-level":[75],"prompt":[76],"editor":[77],"with":[78],"low-level":[79],"fine-tuning":[81],"via":[82],"Group":[83],"Relative":[84],"Policy":[85],"Optimization":[86],"(GRPO),":[87],"STARE":[88],"attains":[89],"68%":[91],"improvement":[92],"in":[93],"Attack":[94],"Success":[95],"Rate":[96],"over":[97],"state-of-the-art":[98],"baselines.":[102],"More":[103],"importantly,":[104],"this":[105,147],"trajectory-level":[106],"view":[107],"surfaces":[108],"Optimization-Induced":[110],"Phase":[111],"Alignment":[112],"phenomenon:":[113],"vanilla":[114],"models":[115],"exhibit":[116],"diffuse":[117],"toxicity,":[118],"whereas":[119],"optimization":[121],"concentrates":[122],"conceptual":[123],"harms":[124,131],"into":[125,132,173],"early":[126],"semantic":[127],"phases":[128],"detail-oriented":[130],"late":[133],"refinement.":[134],"Targeted":[135],"perturbations":[136],"either":[138],"window":[139],"selectively":[140],"suppress":[141],"different":[142],"categories,":[144],"indicating":[145],"temporal":[148],"structure":[149],"genuine":[152],"causal":[153],"handle":[154],"rather":[155],"than":[156],"side":[158],"effect":[159],"design.":[163],"The":[164],"phenomenon":[165],"turns":[166],"formation":[168],"from":[169],"chaotic":[171],"process":[172],"small":[175],"set":[176],"predictable":[178],"vulnerability":[179],"windows,":[180],"providing":[181],"both":[182],"potent":[184],"engine":[186],"basis":[189],"phase-aware":[191],"safety":[192],"mechanisms.":[193],"Content":[194],"warning:":[195],"This":[196],"paper":[197],"contains":[198],"examples":[199],"content":[202],"may":[204],"be":[205],"offensive":[206],"or":[207],"disturbing.":[208]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-05T00:00:00"}
