{"id":"https://openalex.org/W4402351907","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650172","title":"CRDA: Content Risk Drift Assessment of Large Language Models through Adversarial Multi-Agent Interaction","display_name":"CRDA: Content Risk Drift Assessment of Large Language Models through Adversarial Multi-Agent Interaction","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402351907","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650172"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10650172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn60899.2024.10650172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079946956","display_name":"Zongzhen Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zongzhen Liu","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012435230","display_name":"Guoyi Li","orcid":"https://orcid.org/0000-0002-9228-4236"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoyi Li","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101271961","display_name":"Bingkang Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingkang Shi","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100356742","display_name":"Xiaodan Zhang","orcid":"https://orcid.org/0000-0001-7002-5447"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodan Zhang","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051863970","display_name":"Jingguo Ge","orcid":"https://orcid.org/0000-0002-6648-324X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingguo Ge","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004458037","display_name":"Yulei Wu","orcid":"https://orcid.org/0000-0003-0801-8443"},"institutions":[{"id":"https://openalex.org/I36234482","display_name":"University of Bristol","ror":"https://ror.org/0524sp257","country_code":"GB","type":"education","lineage":["https://openalex.org/I36234482"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yulei Wu","raw_affiliation_strings":["University of Bristol,School of Electrical, Electronic and Mechanical Engineering,Bristol,UK"],"affiliations":[{"raw_affiliation_string":"University of Bristol,School of Electrical, Electronic and Mechanical Engineering,Bristol,UK","institution_ids":["https://openalex.org/I36234482"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038712940","display_name":"Honglei Lyu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Honglei Lyu","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Cyberspace Security,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5079946956"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12890363,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9825000166893005,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.8225510716438293},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.717367947101593},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.5856654644012451},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4263017773628235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.40966010093688965},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08726221323013306}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.8225510716438293},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.717367947101593},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.5856654644012451},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4263017773628235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40966010093688965},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08726221323013306},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10650172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn60899.2024.10650172","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W3100355250","https://openalex.org/W3105882417","https://openalex.org/W3173465197","https://openalex.org/W3176477796","https://openalex.org/W3184144760","https://openalex.org/W4283026156","https://openalex.org/W4285178342","https://openalex.org/W4285294723","https://openalex.org/W4292779060","https://openalex.org/W4366735819","https://openalex.org/W4384834458","https://openalex.org/W4385374425","https://openalex.org/W4385573759","https://openalex.org/W4385894687","https://openalex.org/W4386044169","https://openalex.org/W4387635776","https://openalex.org/W4387835442","https://openalex.org/W4389009378","https://openalex.org/W4391047179","https://openalex.org/W4392681182","https://openalex.org/W6778883912","https://openalex.org/W6838461927","https://openalex.org/W6851268924","https://openalex.org/W6852033271","https://openalex.org/W6853601813","https://openalex.org/W6855469472","https://openalex.org/W6855759525","https://openalex.org/W6856697067","https://openalex.org/W6857320562","https://openalex.org/W6860754476"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W4246396837","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W3204019825"],"abstract_inverted_index":{"As":[0,239],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"continue":[5],"to":[6,48,86,128,256,284,330],"enhance":[7],"their":[8],"capabilities":[9],"in":[10,24,177,201,319,345,357],"multi-agent":[11,87],"collaborative":[12],"applications,":[13],"the":[14,17,49,66,78,112,153,165,171,181,188,240,251,261,274,288,292,320,326,331,340],"unpredictability":[15],"of":[16,51,80,105,143,155,159,167,185,191,208,260,306,315],"generative":[18,36],"content":[19,37,54,102,156,173,182,205,221,257,264],"risks":[20],"has":[21],"intensified.":[22],"Particularly":[23],"ongoing":[25],"interaction":[26],"scenarios":[27],"with":[28,70,174],"users,":[29],"it":[30],"remains":[31],"unclear":[32],"whether":[33],"there":[34],"is":[35],"risk":[38,55,103,157,183,206,222,258,266],"drift":[39,104,158,184,207,223,259,265],"over":[40],"time.":[41],"In":[42,90,147,297],"this":[43,91,148,160,195,346],"context,":[44],"\"drift":[45],"risk\"":[46],"refers":[47],"trend":[50],"progressively":[52],"intensified":[53],"that":[56,122,137,216,339],"emerges":[57],"during":[58,291,360],"sustained":[59],"adversarial":[60,73,88,117,132,199,241,295,302,334,361],"interactions":[61,133],"among":[62,134],"LLM":[63,135,150,193,279,358],"agents.":[64],"Additionally,":[65],"high":[67],"cost":[68],"associated":[69],"constructing":[71,115],"complex":[72,116],"environments":[74],"for":[75,84,100,114,352],"agents":[76,140,151,247,280,305,359],"impedes":[77],"transferability":[79],"current":[81],"assessment":[82,267],"methods":[83],"LLMs":[85,218,309],"scenarios.":[89],"paper,":[92],"we":[93,163,337],"introduce":[94],"a":[95,120,144,226,236],"low-cost":[96],"and":[97,125,170,203,286,299,317,342],"lightweight":[98],"framework":[99,341],"assessing":[101],"LLMs,":[106],"named":[107],"CRDA.":[108],"This":[109],"framework,":[110],"bypassing":[111],"need":[113],"environments,":[118],"offers":[119],"method":[121],"integrates":[123],"roles":[124,169,301],"responses":[126,178],"memory":[127,179],"guide":[129],"automatically":[130,293],"multi-round":[131,294],"agents,":[136],"is,":[138],"multiple":[139],"as":[141],"avatars":[142],"single":[145],"LLM.":[146,161,262],"approach,":[149],"enable":[152],"analysis":[154],"Moreover,":[162],"explore":[164],"impact":[166],"restricted":[168,245,298],"unsafe":[172],"negative":[175,285],"viewpoints":[176],"on":[180,354],"LLMs.":[186,212],"Considering":[187],"rapid":[189],"advancement":[190],"Chinese":[192,202,211,308],"capabilities,":[194],"study":[196],"selects":[197],"real":[198],"topics":[200],"assesses":[204],"five":[209,307],"representative":[210],"The":[213,263],"research":[214,353],"finds":[215],"these":[217],"exhibit":[219,310],"significant":[220],"even":[224],"after":[225],"certain":[227],"safety":[228,253,355],"alignment,":[229,254],"showing":[230],"an":[231,311],"initial":[232],"increase":[233,314],"followed":[234],"by":[235,272,325],"gradual":[237],"decrease.":[238],"process":[242],"progresses,":[243],"under":[244],"roles,":[246],"more":[248],"effectively":[249],"breach":[250],"model's":[252],"leading":[255],"can":[268],"be":[269],"quantified":[270],"specifically":[271],"measuring":[273],"deterioration":[275,322],"rate":[276,323],"at":[277],"which":[278],"deteriorate":[281],"from":[282],"positive":[283],"analyzing":[287],"underlying":[289],"trends":[290],"interactions.":[296,335],"general":[300],"interactions,":[303],"all":[304],"overall":[312],"average":[313],"31.5%":[316],"16.38%":[318],"cumulative":[321],"respectively":[324],"10th":[327],"round,":[328],"compared":[329],"baseline":[332],"no-roles":[333],"Finally,":[336],"hope":[338],"findings":[343],"presented":[344],"paper":[347],"will":[348],"offer":[349],"valuable":[350],"insights":[351],"alignment":[356],"processes.":[362]},"counts_by_year":[],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
