{"id":"https://openalex.org/W7162428322","doi":"https://doi.org/10.48550/arxiv.2605.25937","title":"Building an Adversarial Malware Dataset by Family and Type: Generation, Evasion, and Poisoning Evaluation","display_name":"Building an Adversarial Malware Dataset by Family and Type: Generation, Evasion, and Poisoning Evaluation","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162428322","doi":"https://doi.org/10.48550/arxiv.2605.25937"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.25937","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137027389","display_name":"David Ko\u0161\u0165\u00e1l","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ko\u0161\u0165\u00e1l, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5033203359","display_name":"Martin Jure\u010dek","orcid":"https://orcid.org/0000-0002-6546-8953"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jure\u010dek, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.5392000079154968,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.5392000079154968,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.4424000084400177,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.0026000000070780516,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.9057999849319458},{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.7627999782562256},{"id":"https://openalex.org/keywords/evasion","display_name":"Evasion (ethics)","score":0.593500018119812},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.44999998807907104},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4496000111103058},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4422999918460846},{"id":"https://openalex.org/keywords/cryptovirology","display_name":"Cryptovirology","score":0.4124000072479248}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.9057999849319458},{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.7627999782562256},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.6564000248908997},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6499000191688538},{"id":"https://openalex.org/C2781251061","wikidata":"https://www.wikidata.org/wiki/Q5416089","display_name":"Evasion (ethics)","level":3,"score":0.593500018119812},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46140000224113464},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.44999998807907104},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4496000111103058},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4422999918460846},{"id":"https://openalex.org/C84525096","wikidata":"https://www.wikidata.org/wiki/Q3506050","display_name":"Cryptovirology","level":3,"score":0.4124000072479248},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.40959998965263367},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.3862999975681305},{"id":"https://openalex.org/C153180980","wikidata":"https://www.wikidata.org/wiki/Q19776675","display_name":"Commit","level":2,"score":0.36489999294281006},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3564000129699707},{"id":"https://openalex.org/C83860907","wikidata":"https://www.wikidata.org/wiki/Q135005","display_name":"Phishing","level":3,"score":0.3544999957084656},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.34790000319480896},{"id":"https://openalex.org/C2778403875","wikidata":"https://www.wikidata.org/wiki/Q20312394","display_name":"Adversarial machine learning","level":3,"score":0.33070001006126404},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3163999915122986}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.25937","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.25937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5563684701919556,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,68],"present":[1],"a":[2,19,82],"dataset":[3,103,119],"of":[4,14,21,29,43,73,84,96,135],"adversarial":[5,22,30,55,90,128],"malware":[6,16,23,74,137],"samples":[7,35,91],"derived":[8],"from":[9,112],"the":[10,50,71,97,101,105,109,133],"public":[11],"RawMal-TF":[12],"collection":[13],"real-world":[15],"binaries.":[17],"Using":[18],"suite":[20],"generators,":[24],"we":[25],"construct":[26],"two":[27],"sets":[28],"PE":[31],"files:":[32],"44,347":[33],"family-labelled":[34,102],"and":[36,46,65,132],"33,596":[37],"type-labelled":[38],"samples,":[39],"achieving":[40],"evasion":[41,106],"rates":[42],"98.35":[44],"%":[45,48,95,114],"92.20":[47],"against":[49,108],"EMBER":[51,63],"classifier,":[52],"respectively.":[53],"Each":[54],"binary":[56],"is":[57,120],"accompanied":[58],"by":[59],"detailed":[60],"metadata,":[61],"including":[62],"scores":[64],"VirusTotal":[66],"classifications.":[67],"further":[69],"demonstrate":[70],"susceptibility":[72],"classification":[75],"pipelines":[76],"to":[77,115,123],"data":[78,99],"poisoning":[79,130],"attacks":[80],"through":[81],"series":[83],"training":[85,98],"experiments.":[86],"Injecting":[87],"fully":[88],"mislabelled":[89],"representing":[92],"only":[93],"0.5":[94],"in":[100],"increases":[104],"rate":[107],"re-trained":[110],"classifier":[111],"26.1":[113],"92.8":[116],"%.":[117],"The":[118],"publicly":[121],"released":[122],"facilitate":[124],"future":[125],"research":[126],"on":[127],"malware,":[129],"attacks,":[131],"robustness":[134],"machine-learning-based":[136],"detection":[138],"systems.":[139]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
