{"id":"https://openalex.org/W4412889630","doi":"https://doi.org/10.18653/v1/2025.acl-long.1571","title":"Merge Hijacking: Backdoor Attacks to Model Merging of Large Language Models","display_name":"Merge Hijacking: Backdoor Attacks to Model Merging of Large Language Models","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412889630","doi":"https://doi.org/10.18653/v1/2025.acl-long.1571"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-long.1571","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1571","pdf_url":"https://aclanthology.org/2025.acl-long.1571.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-long.1571.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014040279","display_name":"Zenghui Yuan","orcid":"https://orcid.org/0000-0002-2839-9127"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zenghui Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011384152","display_name":"Y. P. Xu","orcid":"https://orcid.org/0000-0002-8476-9217"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yangming Xu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103250105","display_name":"Jiawen Shi","orcid":"https://orcid.org/0009-0009-9690-4293"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiawen Shi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693197","display_name":"Pan Zhou","orcid":"https://orcid.org/0000-0002-8629-4622"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan Zhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5015105117","display_name":"Lichao Sun","orcid":"https://orcid.org/0000-0003-1539-7939"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lichao Sun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7588,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.87799014,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"32688","last_page":"32703"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9075999855995178,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9075999855995178,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/backdoor","display_name":"Backdoor","score":0.9886472225189209},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7752851247787476},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.7471692562103271},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.49064555764198303},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3257961869239807},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.1599298119544983}],"concepts":[{"id":"https://openalex.org/C2781045450","wikidata":"https://www.wikidata.org/wiki/Q254569","display_name":"Backdoor","level":2,"score":0.9886472225189209},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7752851247787476},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.7471692562103271},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.49064555764198303},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3257961869239807},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.1599298119544983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.acl-long.1571","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1571","pdf_url":"https://aclanthology.org/2025.acl-long.1571.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-long.1571","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-long.1571","pdf_url":"https://aclanthology.org/2025.acl-long.1571.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","score":0.5,"display_name":"Gender equality"}],"awards":[{"id":"https://openalex.org/G664739573","display_name":null,"funder_award_id":"62476107","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412889630.pdf","grobid_xml":"https://content.openalex.org/works/W4412889630.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4320031223","https://openalex.org/W4200629851","https://openalex.org/W4281902577","https://openalex.org/W4309417370","https://openalex.org/W4292107232","https://openalex.org/W3009072493","https://openalex.org/W4401407399"],"abstract_inverted_index":{"Model":[0],"merging":[1,36,54,109,122],"for":[2,22],"Large":[3],"Language":[4],"Models":[5],"(LLMs)":[6],"directly":[7],"fuses":[8],"the":[9,48,75,80,101,116],"parameters":[10],"of":[11,103],"different":[12,107],"models":[13,30],"finetuned":[14],"on":[15,32],"various":[16],"tasks,":[17],"creating":[18],"a":[19,59,66],"unified":[20],"model":[21,35,53,62,78],"multi-domain":[23],"tasks.However,":[24],"due":[25],"to":[26,39],"potential":[27],"vulnerabilities":[28],"in":[29,55],"available":[31],"open-source":[33],"platforms,":[34],"is":[37],"susceptible":[38],"backdoor":[40,50,81],"attacks.In":[41],"this":[42],"paper,":[43],"we":[44,113],"propose":[45],"Merge":[46],"Hijacking,":[47],"first":[49],"attack":[51,105,117,126],"targeting":[52],"LLMs.The":[56],"attacker":[57],"constructs":[58],"malicious":[60],"upload":[61],"and":[63,92,111,134,136],"releases":[64],"it.Once":[65],"victim":[67],"user":[68],"merges":[69],"it":[70],"with":[71],"any":[72],"other":[73],"models,":[74,108],"resulting":[76],"merged":[77],"inherits":[79],"while":[82],"maintaining":[83],"utility":[84],"across":[85,106],"tasks.Merge":[86],"Hijacking":[87],"defines":[88],"two":[89,130],"main":[90],"objectives-effectiveness":[91],"utility-and":[93],"achieves":[94],"them":[95],"through":[96],"four":[97],"steps.Extensive":[98],"experiments":[99],"demonstrate":[100],"effectiveness":[102],"our":[104,125],"algorithms,":[110],"tasks.Additionally,":[112],"show":[114],"that":[115],"remains":[118],"effective":[119],"even":[120],"when":[121],"real-world":[123],"models.Moreover,":[124],"demonstrates":[127],"robustness":[128],"against":[129],"inference-time":[131],"defenses":[132],"(Paraphrasing":[133],"CLEANGEN)":[135],"one":[137],"training-time":[138],"defense":[139],"(Fine-pruning).":[140]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
