{"id":"https://openalex.org/W4398191955","doi":"https://doi.org/10.1145/3664646.3664764","title":"Measuring Impacts of Poisoning on Model Parameters and Embeddings for Large Language Models of Code","display_name":"Measuring Impacts of Poisoning on Model Parameters and Embeddings for Large Language Models of Code","publication_year":2024,"publication_date":"2024-07-10","ids":{"openalex":"https://openalex.org/W4398191955","doi":"https://doi.org/10.1145/3664646.3664764"},"language":"en","primary_location":{"id":"doi:10.1145/3664646.3664764","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664646.3664764","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st ACM International Conference on AI-Powered Software","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.11466","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003061205","display_name":"Aftab Hussain","orcid":"https://orcid.org/0009-0001-7415-9650"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aftab Hussain","raw_affiliation_strings":["University of Houston, Houston, USA"],"raw_orcid":"https://orcid.org/0009-0001-7415-9650","affiliations":[{"raw_affiliation_string":"University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016296157","display_name":"Md Rafiqul Islam Rabin","orcid":"https://orcid.org/0000-0001-5575-0528"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Md Rafiqul Islam Rabin","raw_affiliation_strings":["University of Houston, Houston, USA"],"raw_orcid":"https://orcid.org/0000-0001-5575-0528","affiliations":[{"raw_affiliation_string":"University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090034689","display_name":"Mohammad Amin Alipour","orcid":"https://orcid.org/0000-0002-6479-7202"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohammad Amin Alipour","raw_affiliation_strings":["University of Houston, Houston, USA"],"raw_orcid":"https://orcid.org/0000-0002-6479-7202","affiliations":[{"raw_affiliation_string":"University of Houston, Houston, USA","institution_ids":["https://openalex.org/I44461941"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3791,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.84472163,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"59","last_page":"64"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/backdoor","display_name":"Backdoor","score":0.9959390163421631},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.7335726022720337},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.647727906703949},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6410765647888184},{"id":"https://openalex.org/keywords/aka","display_name":"AKA","score":0.620974063873291},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.5374254584312439},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5105243921279907},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36142221093177795},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3242959976196289},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32056349515914917},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2102683186531067},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.0925341546535492}],"concepts":[{"id":"https://openalex.org/C2781045450","wikidata":"https://www.wikidata.org/wiki/Q254569","display_name":"Backdoor","level":2,"score":0.9959390163421631},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.7335726022720337},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.647727906703949},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6410765647888184},{"id":"https://openalex.org/C121158502","wikidata":"https://www.wikidata.org/wiki/Q4652161","display_name":"AKA","level":2,"score":0.620974063873291},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.5374254584312439},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5105243921279907},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36142221093177795},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3242959976196289},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32056349515914917},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2102683186531067},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0925341546535492},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C161191863","wikidata":"https://www.wikidata.org/wiki/Q199655","display_name":"Library science","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3664646.3664764","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664646.3664764","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st ACM International Conference on AI-Powered Software","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2405.11466","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.11466","pdf_url":"https://arxiv.org/pdf/2405.11466","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.11466","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.11466","pdf_url":"https://arxiv.org/pdf/2405.11466","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.4300000071525574}],"awards":[{"id":"https://openalex.org/G577096103","display_name":null,"funder_award_id":"W911NF20C0038","funder_id":"https://openalex.org/F4320333051","funder_display_name":"Intelligence Advanced Research Projects Activity"}],"funders":[{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320333051","display_name":"Intelligence Advanced Research Projects Activity","ror":"https://ror.org/01v3fsc55"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4398191955.pdf","grobid_xml":"https://content.openalex.org/works/W4398191955.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W2118020555","https://openalex.org/W2187089797","https://openalex.org/W2972135640","https://openalex.org/W2979792666","https://openalex.org/W2997591727","https://openalex.org/W3160638507","https://openalex.org/W3210860486","https://openalex.org/W4285077966","https://openalex.org/W4308627220","https://openalex.org/W4312044266","https://openalex.org/W4365799995","https://openalex.org/W4388229767"],"related_works":["https://openalex.org/W4320031223","https://openalex.org/W4200629851","https://openalex.org/W4281902577","https://openalex.org/W4309417370","https://openalex.org/W4292107232","https://openalex.org/W3009072493","https://openalex.org/W4386080799","https://openalex.org/W3140988292","https://openalex.org/W4317672133","https://openalex.org/W4386185023"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"have":[4,14],"revolutionized":[5],"software":[6],"development":[7],"practices,":[8],"yet":[9],"concerns":[10],"about":[11],"their":[12],"safety":[13],"arisen,":[15],"particularly":[16],"regarding":[17],"hidden":[18],"backdoors,":[19],"aka":[20],"trojans.":[21],"Backdoor":[22],"attacks":[23],"involve":[24],"the":[25,36,39,49,71,92,123],"insertion":[26],"of":[27,38,70,87,115,120,125],"triggers":[28],"into":[29],"training":[30],"data,":[31],"allowing":[32],"attackers":[33],"to":[34,52,109],"manipulate":[35],"behavior":[37],"model":[40,50],"maliciously.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45,61],"focus":[46],"on":[47],"analyzing":[48],"parameters":[51,126],"detect":[53],"potential":[54],"backdoor":[55,116],"signals":[56,117],"in":[57,84,112,118],"code":[58,121],"models.":[59,78],"Specifically,":[60],"examine":[62],"attention":[63,96],"weights":[64,97],"and":[65,67,73,76,98,127],"biases,":[66],"context":[68,85],"embeddings":[69,86],"clean":[72],"poisoned":[74,88,93],"CodeBERT":[75],"CodeT5":[77],"Our":[79],"results":[80],"suggest":[81],"noticeable":[82],"patterns":[83],"samples":[89],"for":[90],"both":[91],"models;":[94],"however,":[95],"biases":[99],"do":[100],"not":[101],"show":[102],"any":[103],"significant":[104],"differences.":[105],"This":[106],"work":[107],"contributes":[108],"ongoing":[110],"efforts":[111],"white-box":[113],"detection":[114],"LLMs":[119],"through":[122],"analysis":[124],"embeddings.":[128]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2024-05-22T00:00:00"}
