{"id":"https://openalex.org/W4403487732","doi":"https://doi.org/10.3233/faia240685","title":"Target-driven Attack for Large Language Models","display_name":"Target-driven Attack for Large Language Models","publication_year":2024,"publication_date":"2024-10-16","ids":{"openalex":"https://openalex.org/W4403487732","doi":"https://doi.org/10.3233/faia240685"},"language":"en","primary_location":{"id":"doi:10.3233/faia240685","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240685","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240685","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240685","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107249162","display_name":"Chong Zhang","orcid":"https://orcid.org/0000-0003-0497-8068"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chong Zhang","raw_affiliation_strings":["Xi\u2019an Jiaotong-Liverpool University","Xi'an Jiaotong-Liverpool University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xi\u2019an Jiaotong-Liverpool University","institution_ids":["https://openalex.org/I69356397"]},{"raw_affiliation_string":"Xi'an Jiaotong-Liverpool University","institution_ids":["https://openalex.org/I69356397"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102521857","display_name":"Mingyu Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I4210096112","display_name":"Rutgers Sexual and Reproductive Health and Rights","ror":"https://ror.org/00rcvgx40","country_code":"NL","type":"other","lineage":["https://openalex.org/I4210096112"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mingyu Jin","raw_affiliation_strings":["Rutgers University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rutgers University","institution_ids":["https://openalex.org/I4210096112"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Dong Shu","orcid":null},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Shu","raw_affiliation_strings":["Northwestern University","Northwestern University d Rochester Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northwestern University","institution_ids":[]},{"raw_affiliation_string":"Northwestern University d Rochester Institute of Technology","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042945834","display_name":"T Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Taowen Wang","raw_affiliation_strings":["Rochester Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rochester Institute of Technology","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101979292","display_name":"Dongfang Liu","orcid":"https://orcid.org/0000-0002-9624-8240"},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dongfang Liu","raw_affiliation_strings":["Rochester Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rochester Institute of Technology","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011077051","display_name":"Xiaobo Jin","orcid":"https://orcid.org/0000-0003-1671-1379"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaobo Jin","raw_affiliation_strings":["Xi\u2019an Jiaotong-Liverpool University","Xi'an Jiaotong-Liverpool University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Xi\u2019an Jiaotong-Liverpool University","institution_ids":["https://openalex.org/I69356397"]},{"raw_affiliation_string":"Xi'an Jiaotong-Liverpool University","institution_ids":["https://openalex.org/I69356397"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5011077051"],"corresponding_institution_ids":["https://openalex.org/I69356397"],"apc_list":null,"apc_paid":null,"fwci":2.119,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.8897141,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9735999703407288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5368597507476807}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5368597507476807}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/faia240685","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240685","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240685","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},{"id":"pmh:oai:arXiv.org:2411.07268","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.07268","pdf_url":"https://arxiv.org/pdf/2411.07268","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.3233/faia240685","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240685","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240685","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403487732.pdf"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W2799007037","https://openalex.org/W2799194071","https://openalex.org/W2898695519","https://openalex.org/W2962818281","https://openalex.org/W2963323070","https://openalex.org/W2963859254","https://openalex.org/W2964120615","https://openalex.org/W2982756474","https://openalex.org/W2996851481","https://openalex.org/W3035507081","https://openalex.org/W3097375194","https://openalex.org/W3098267758","https://openalex.org/W3101449015","https://openalex.org/W3105604018","https://openalex.org/W3134642945","https://openalex.org/W3170403598","https://openalex.org/W4225858632","https://openalex.org/W4287210714","https://openalex.org/W4287393336","https://openalex.org/W4309395891","https://openalex.org/W4312643954","https://openalex.org/W4322718191","https://openalex.org/W4323572061","https://openalex.org/W4323709479","https://openalex.org/W4379958452","https://openalex.org/W4380353722","https://openalex.org/W4381245716","https://openalex.org/W4385714464","https://openalex.org/W4386557007","https://openalex.org/W4387075795","https://openalex.org/W4387806231","https://openalex.org/W4388650587"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Current":[0],"large":[1,48],"language":[2,13,36],"models":[3],"(LLM)":[4],"provide":[5],"a":[6,47],"strong":[7],"foundation":[8],"for":[9],"large-scale":[10],"user-oriented":[11],"natural":[12],"tasks.":[14],"Many":[15],"users":[16],"can":[17],"easily":[18],"inject":[19],"adversarial":[20],"text":[21,107,111,137],"or":[22],"instructions":[23],"through":[24],"the":[25,35,40,73,97,101,105,109,114,119,130,135,140,143,149,153,180],"user":[26],"interface,":[27],"thus":[28,79],"causing":[29],"LLM":[30],"model":[31,37,82],"security":[32],"challenges":[33],"like":[34],"not":[38],"giving":[39],"correct":[41],"answer.":[42],"Although":[43],"there":[44],"is":[45,66],"currently":[46],"amount":[49],"of":[50,56,76,104,182],"research":[51],"on":[52,129,172],"black-box":[53,58,92,158],"attacks,":[54],"most":[55],"these":[57,69],"attacks":[59,77],"use":[60],"random":[61],"and":[62,78,108,138,167,177],"heuristic":[63],"strategies.":[64],"It":[65],"unclear":[67],"how":[68],"strategies":[70],"relate":[71],"to":[72,95,112,133,152],"success":[74],"rate":[75],"effectively":[80],"improve":[81],"robustness.":[83],"To":[84],"solve":[85,134],"this":[86],"problem,":[87],"we":[88],"propose":[89],"our":[90,183],"target-driven":[91,157],"attack":[93,110,131,136,154,159,163,184],"method":[94],"maximize":[96],"KL":[98],"divergence":[99],"between":[100],"conditional":[102],"probabilities":[103],"clean":[106],"redefine":[113],"attack\u2019s":[115],"goal.":[116],"We":[117],"transform":[118],"distance":[120],"maximization":[121],"problem":[122],"into":[123],"two":[124,162],"convex":[125],"optimization":[126],"problems":[127],"based":[128],"goal":[132],"estimate":[139],"covariance.":[141],"Furthermore,":[142],"projected":[144],"gradient":[145],"descent":[146],"algorithm":[147],"solves":[148],"vector":[150],"corresponding":[151],"text.":[155],"Our":[156],"approach":[160],"includes":[161],"strategies:":[164],"token":[165],"manipulation":[166],"misinformation":[168],"attack.":[169],"Experimental":[170],"results":[171],"multiple":[173],"Large":[174],"Language":[175],"Models":[176],"datasets":[178],"demonstrate":[179],"effectiveness":[181],"method.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
