{"id":"https://openalex.org/W7140314845","doi":"https://doi.org/10.48550/arxiv.2603.22717","title":"Does Teaming-Up LLMs Improve Secure Code Generation? A Comprehensive Evaluation with Multi-LLMSecCodeEval","display_name":"Does Teaming-Up LLMs Improve Secure Code Generation? A Comprehensive Evaluation with Multi-LLMSecCodeEval","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140314845","doi":"https://doi.org/10.48550/arxiv.2603.22717"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22717","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22717","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089776133","display_name":"Bushra Sabir","orcid":"https://orcid.org/0000-0003-4303-5169"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sabir, Bushra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130599832","display_name":"Shigang Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Shigang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067534316","display_name":"Seung Ick Jang","orcid":"https://orcid.org/0000-0002-0544-7982"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jang, Seung Ick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123721316","display_name":"Sharif Abuadbba","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abuadbba, Sharif","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130549655","display_name":"Yansong Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yansong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130612534","display_name":"Kristen Moore","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moore, Kristen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130568999","display_name":"SangCheol Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, SangCheol","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130585518","display_name":"Hyoungshick Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Hyoungshick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130617579","display_name":"Surya Nepal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nepal, Surya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.34630000591278076,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.34630000591278076,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.1662999987602234,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10734","display_name":"Information and Cyber Security","score":0.13570000231266022,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.6510999798774719},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6327000260353088},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5683000087738037},{"id":"https://openalex.org/keywords/vulnerability","display_name":"Vulnerability (computing)","score":0.5654000043869019},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5303999781608582},{"id":"https://openalex.org/keywords/static-analysis","display_name":"Static analysis","score":0.3707999885082245},{"id":"https://openalex.org/keywords/security-analysis","display_name":"Security analysis","score":0.34150001406669617}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7343999743461609},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.6510999798774719},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6327000260353088},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5683000087738037},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.5654000043869019},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5303999781608582},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.43720000982284546},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.3707999885082245},{"id":"https://openalex.org/C38369872","wikidata":"https://www.wikidata.org/wiki/Q7445009","display_name":"Security analysis","level":2,"score":0.34150001406669617},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C167063184","wikidata":"https://www.wikidata.org/wiki/Q1400839","display_name":"Vulnerability assessment","level":3,"score":0.2946999967098236},{"id":"https://openalex.org/C121822524","wikidata":"https://www.wikidata.org/wiki/Q5157582","display_name":"Computer security model","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C178489894","wikidata":"https://www.wikidata.org/wiki/Q8789","display_name":"Cryptography","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C62913178","wikidata":"https://www.wikidata.org/wiki/Q7554361","display_name":"Software security assurance","level":4,"score":0.25209999084472656},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.25099998712539673},{"id":"https://openalex.org/C77109596","wikidata":"https://www.wikidata.org/wiki/Q4781497","display_name":"Application security","level":5,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22717","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22717","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22717","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automatically":[0],"generating":[1],"source":[2],"code":[3,43,98,183],"from":[4,187,190],"natural":[5],"language":[6,9],"using":[7],"large":[8,174],"models":[10],"(LLMs)":[11],"is":[12],"becoming":[13],"common,":[14],"yet":[15],"security":[16,54,138],"vulnerabilities":[17],"persist":[18],"despite":[19],"advances":[20],"in":[21],"fine":[22],"tuning":[23],"and":[24,36,52,67,72,83,110,133,149],"prompting.":[25],"In":[26],"this":[27],"work,":[28],"we":[29,74],"systematically":[30],"evaluate":[31],"whether":[32],"multi":[33,169,193],"LLM":[34,102,116],"ensembles":[35,171],"collaborative":[37,118,150],"strategies":[38],"can":[39],"meaningfully":[40],"improve":[41,96],"secure":[42,97,182],"generation.":[44],"We":[45],"present":[46],"MULTI-LLMSECCODEEVAL,":[47],"a":[48],"framework":[49],"for":[50],"assessing":[51],"enhancing":[53],"across":[55],"the":[56,136,141],"vulnerability":[57],"management":[58],"lifecycle":[59],"by":[60,104,145,152],"combining":[61],"multiple":[62],"LLMs":[63],"with":[64,93],"static":[65,94],"analysis":[66,95],"structured":[68,168],"collaboration.":[69],"Using":[70],"SecLLMEval":[71,109],"SecLLMHolmes,":[73,113],"benchmark":[75],"ten":[76],"pipelines":[77,91,119,128],"spanning":[78],"single":[79,101],"model,":[80],"ensemble,":[81],"collaborative,":[82],"hybrid":[84],"designs.":[85],"Our":[86],"results":[87],"show":[88],"that":[89,129,159,181],"ensemble":[90,143],"augmented":[92],"generation":[99],"over":[100],"baselines":[103,151],"up":[105],"to":[106,125,147,154],"47.3%":[107],"on":[108,112],"19.3%":[111],"while":[114],"purely":[115],"based":[117],"yield":[120],"smaller":[121],"gains":[122],"of":[123],"8.9%":[124],"22.3%.":[126],"Hybrid":[127],"integrate":[130],"ensembling,":[131],"detection,":[132],"patching":[134],"achieve":[135],"strongest":[137],"performance,":[139],"outperforming":[140],"best":[142],"baseline":[144],"1.78%":[146],"4.72%":[148],"19.81%":[153],"26.78%.":[155],"Ablation":[156],"studies":[157],"reveal":[158],"model":[160,170,194],"scale":[161],"alone":[162],"does":[163,184],"not":[164,185],"ensure":[165],"security.":[166],"Smaller,":[167],"consistently":[172],"outperform":[173],"monolithic":[175],"LLMs.":[176],"Overall,":[177],"our":[178],"findings":[179],"demonstrate":[180],"emerge":[186],"scale,":[188],"but":[189],"carefully":[191],"orchestrated":[192],"system":[195],"design.":[196]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-26T00:00:00"}
