{"id":"https://openalex.org/W2000159976","doi":"https://doi.org/10.1145/2808769.2808780","title":"Better Malware Ground Truth","display_name":"Better Malware Ground Truth","publication_year":2015,"publication_date":"2015-10-06","ids":{"openalex":"https://openalex.org/W2000159976","doi":"https://doi.org/10.1145/2808769.2808780","mag":"2000159976"},"language":"en","primary_location":{"id":"doi:10.1145/2808769.2808780","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2808769.2808780","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2808769.2808780?download=true","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th ACM Workshop on Artificial Intelligence and Security","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/2808769.2808780?download=true","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033041590","display_name":"Alex Kantchelian","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Kantchelian","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088732631","display_name":"Michael Carl Tschantz","orcid":"https://orcid.org/0000-0003-1367-3784"},"institutions":[{"id":"https://openalex.org/I1297971548","display_name":"International Computer Science Institute","ror":"https://ror.org/01ewh7m12","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1297971548"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Carl Tschantz","raw_affiliation_strings":["International Computer Science Institute, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Computer Science Institute, Berkeley, CA, USA","institution_ids":["https://openalex.org/I1297971548"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003132155","display_name":"Sadia Afroz","orcid":"https://orcid.org/0000-0002-2485-548X"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sadia Afroz","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089038367","display_name":"Brad Miller","orcid":"https://orcid.org/0000-0001-8035-7437"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brad Miller","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112327867","display_name":"Vaishaal Shankar","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vaishaal Shankar","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051014263","display_name":"Rekha Bachwani","orcid":"https://orcid.org/0000-0003-4296-9592"},"institutions":[{"id":"https://openalex.org/I869089601","display_name":"Netflix (United States)","ror":"https://ror.org/0197qw696","country_code":"US","type":"company","lineage":["https://openalex.org/I869089601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rekha Bachwani","raw_affiliation_strings":["Netflix, San Francisco, CA, USA","Netflix, San Francisco, CA, USA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Netflix, San Francisco, CA, USA","institution_ids":["https://openalex.org/I869089601"]},{"raw_affiliation_string":"Netflix, San Francisco, CA, USA#TAB#","institution_ids":["https://openalex.org/I869089601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017381278","display_name":"Anthony D. Joseph","orcid":"https://orcid.org/0000-0002-6798-9664"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anthony D. Joseph","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113907559","display_name":"J. D. Tygar","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. D. Tygar","raw_affiliation_strings":["UC Berkeley, Berkeley, CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I134446601","https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.9591,"has_fulltext":true,"cited_by_count":89,"citation_normalized_percentile":{"value":0.97498419,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"45","last_page":"56"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.9012718200683594},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6863881349563599},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.5891659259796143},{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.5772181749343872},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5526363849639893},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.5367596745491028},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.5022029876708984},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4607246220111847},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.44878318905830383},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4171801209449768},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.139047771692276},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12066537141799927}],"concepts":[{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.9012718200683594},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6863881349563599},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.5891659259796143},{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.5772181749343872},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5526363849639893},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.5367596745491028},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.5022029876708984},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4607246220111847},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.44878318905830383},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4171801209449768},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.139047771692276},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12066537141799927},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2808769.2808780","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2808769.2808780","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2808769.2808780?download=true","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th ACM Workshop on Artificial Intelligence and Security","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/2808769.2808780","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2808769.2808780","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2808769.2808780?download=true","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 8th ACM Workshop on Artificial Intelligence and Security","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6000000238418579,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G4713059963","display_name":null,"funder_award_id":"FA8750","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G589244659","display_name":null,"funder_award_id":"XData Award FA8750-12-2-0331","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G6104336868","display_name":null,"funder_award_id":"0424422","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6284359468","display_name":null,"funder_award_id":"Award 7076018","funder_id":"https://openalex.org/F4320338292","funder_display_name":"Lawrence Berkeley National Laboratory"},{"id":"https://openalex.org/G6398089940","display_name":"Making Sense at Scale with Algorithms, Machines, and People","funder_award_id":"1139158","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7103680314","display_name":null,"funder_award_id":"FA8750-12-2-0331","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G7777668068","display_name":null,"funder_award_id":"0424422,1139158","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8560804567","display_name":null,"funder_award_id":"7076018","funder_id":"https://openalex.org/F4320338292","funder_display_name":"Lawrence Berkeley National Laboratory"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320307791","display_name":"Cisco Systems","ror":"https://ror.org/03yt1ez60"},{"id":"https://openalex.org/F4320316505","display_name":"NetApp","ror":"https://ror.org/05c4cm338"},{"id":"https://openalex.org/F4320316785","display_name":"VMware","ror":null},{"id":"https://openalex.org/F4320320952","display_name":"International Science and Technology Center","ror":"https://ror.org/03fn1w943"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332195","display_name":"Samsung","ror":"https://ror.org/04w3jy968"},{"id":"https://openalex.org/F4320338292","display_name":"Lawrence Berkeley National Laboratory","ror":"https://ror.org/02jbv0t02"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2000159976.pdf","grobid_xml":"https://content.openalex.org/works/W2000159976.grobid-xml"},"referenced_works_count":68,"referenced_works":["https://openalex.org/W9014458","https://openalex.org/W36091977","https://openalex.org/W58852127","https://openalex.org/W62298501","https://openalex.org/W79549259","https://openalex.org/W85077918","https://openalex.org/W94487276","https://openalex.org/W101596157","https://openalex.org/W123019559","https://openalex.org/W192227941","https://openalex.org/W1519407765","https://openalex.org/W1581009051","https://openalex.org/W1586252162","https://openalex.org/W1591082683","https://openalex.org/W1773541209","https://openalex.org/W1827212170","https://openalex.org/W1851403712","https://openalex.org/W1879313991","https://openalex.org/W1966948031","https://openalex.org/W1978086230","https://openalex.org/W1987644478","https://openalex.org/W1988146703","https://openalex.org/W2003094813","https://openalex.org/W2010135967","https://openalex.org/W2042058229","https://openalex.org/W2042742130","https://openalex.org/W2050855115","https://openalex.org/W2057079516","https://openalex.org/W2060514845","https://openalex.org/W2063898900","https://openalex.org/W2077278164","https://openalex.org/W2082190528","https://openalex.org/W2092942461","https://openalex.org/W2094776491","https://openalex.org/W2097089247","https://openalex.org/W2103464385","https://openalex.org/W2112507308","https://openalex.org/W2114545736","https://openalex.org/W2116664070","https://openalex.org/W2117202485","https://openalex.org/W2118585731","https://openalex.org/W2120913037","https://openalex.org/W2121749752","https://openalex.org/W2122052811","https://openalex.org/W2125943921","https://openalex.org/W2126047957","https://openalex.org/W2129345386","https://openalex.org/W2129650357","https://openalex.org/W2138644293","https://openalex.org/W2142518823","https://openalex.org/W2144112223","https://openalex.org/W2149273804","https://openalex.org/W2152442131","https://openalex.org/W2164163973","https://openalex.org/W2165357553","https://openalex.org/W2170529403","https://openalex.org/W2203388234","https://openalex.org/W2400462880","https://openalex.org/W2401293755","https://openalex.org/W2482374127","https://openalex.org/W2483752640","https://openalex.org/W2484102177","https://openalex.org/W2534043454","https://openalex.org/W2596356468","https://openalex.org/W2596585349","https://openalex.org/W2597289420","https://openalex.org/W2604272474","https://openalex.org/W6604009900"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W2535204567","https://openalex.org/W4380551139","https://openalex.org/W2280377497","https://openalex.org/W3174044702","https://openalex.org/W4238433571","https://openalex.org/W2967848559","https://openalex.org/W4283803360","https://openalex.org/W4317695495"],"abstract_inverted_index":{"We":[0,48,60],"examine":[1],"the":[2,6,35,44,75],"problem":[3],"of":[4,8,37,71],"aggregating":[5],"results":[7],"multiple":[9],"anti-virus":[10],"(AV)":[11],"vendors'":[12],"detectors":[13],"into":[14],"a":[15,28,38],"single":[16],"authoritative":[17],"ground-truth":[18],"label":[19],"for":[20,55,74],"every":[21],"binary.":[22],"To":[23],"do":[24],"so,":[25],"we":[26],"adapt":[27],"well-known":[29],"generative":[30],"Bayesian":[31],"model":[32],"that":[33],"postulates":[34],"existence":[36],"hidden":[39],"ground":[40],"truth":[41],"upon":[42],"which":[43,72],"AV":[45],"labels":[46],"depend.":[47],"use":[49],"training":[50],"based":[51],"on":[52],"Expectation":[53],"Maximization":[54],"this":[56],"fully":[57],"unsupervised":[58],"technique.":[59],"evaluate":[61],"our":[62],"method":[63],"using":[64],"279,327":[65],"distinct":[66],"binaries":[67],"from":[68],"VirusTotal,":[69],"each":[70],"appeared":[73],"first":[76],"time":[77],"between":[78],"January":[79],"2012":[80],"and":[81],"June":[82],"2014.":[83]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":13},{"year":2019,"cited_by_count":12},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":8},{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
