{"id":"https://openalex.org/W4407209053","doi":"https://doi.org/10.1145/3701716.3715212","title":"ClarAVy: A Tool for Scalable and Accurate Malware Family Labeling","display_name":"ClarAVy: A Tool for Scalable and Accurate Malware Family Labeling","publication_year":2025,"publication_date":"2025-05-08","ids":{"openalex":"https://openalex.org/W4407209053","doi":"https://doi.org/10.1145/3701716.3715212"},"language":"en","primary_location":{"id":"doi:10.1145/3701716.3715212","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3701716.3715212","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3701716.3715212","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3701716.3715212","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008388322","display_name":"Robert J. Joyce","orcid":"https://orcid.org/0009-0003-7168-1237"},"institutions":[{"id":"https://openalex.org/I1322124587","display_name":"Booz Allen Hamilton (United States)","ror":"https://ror.org/051rcp357","country_code":"US","type":"company","lineage":["https://openalex.org/I1322124587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Robert J. Joyce","raw_affiliation_strings":["Booz Allen Hamilton, McLean, VA, USA"],"raw_orcid":"https://orcid.org/0009-0003-7168-1237","affiliations":[{"raw_affiliation_string":"Booz Allen Hamilton, McLean, VA, USA","institution_ids":["https://openalex.org/I1322124587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080234803","display_name":"D. Everett","orcid":"https://orcid.org/0000-0003-3593-5255"},"institutions":[{"id":"https://openalex.org/I1322124587","display_name":"Booz Allen Hamilton (United States)","ror":"https://ror.org/051rcp357","country_code":"US","type":"company","lineage":["https://openalex.org/I1322124587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Derek Everett","raw_affiliation_strings":["Booz Allen Hamilton, McLean, VA, USA"],"raw_orcid":"https://orcid.org/0000-0003-3593-5255","affiliations":[{"raw_affiliation_string":"Booz Allen Hamilton, McLean, VA, USA","institution_ids":["https://openalex.org/I1322124587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043932284","display_name":"Maya Fuchs","orcid":"https://orcid.org/0000-0002-0771-2647"},"institutions":[{"id":"https://openalex.org/I1322124587","display_name":"Booz Allen Hamilton (United States)","ror":"https://ror.org/051rcp357","country_code":"US","type":"company","lineage":["https://openalex.org/I1322124587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maya Fuchs","raw_affiliation_strings":["Booz Allen Hamilton, McLean, VA, USA"],"raw_orcid":"https://orcid.org/0000-0002-0771-2647","affiliations":[{"raw_affiliation_string":"Booz Allen Hamilton, McLean, VA, USA","institution_ids":["https://openalex.org/I1322124587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068036546","display_name":"Edward Raff","orcid":"https://orcid.org/0000-0002-9900-1972"},"institutions":[{"id":"https://openalex.org/I1322124587","display_name":"Booz Allen Hamilton (United States)","ror":"https://ror.org/051rcp357","country_code":"US","type":"company","lineage":["https://openalex.org/I1322124587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edward Raff","raw_affiliation_strings":["Booz Allen Hamilton, McLean, VA, USA"],"raw_orcid":"https://orcid.org/0000-0002-9900-1972","affiliations":[{"raw_affiliation_string":"Booz Allen Hamilton, McLean, VA, USA","institution_ids":["https://openalex.org/I1322124587"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102861683","display_name":"James Holt","orcid":"https://orcid.org/0000-0002-6368-8696"},"institutions":[{"id":"https://openalex.org/I4210113003","display_name":"Physical Sciences (United States)","ror":"https://ror.org/021qvjc46","country_code":"US","type":"company","lineage":["https://openalex.org/I4210113003"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James Holt","raw_affiliation_strings":["Laboratory for Physical Sciences, College Park, MD, USA"],"raw_orcid":"https://orcid.org/0000-0002-6368-8696","affiliations":[{"raw_affiliation_string":"Laboratory for Physical Sciences, College Park, MD, USA","institution_ids":["https://openalex.org/I4210113003"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.128,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.84398525,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"277","last_page":"286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.8625068068504333},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.781241774559021},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6508780121803284},{"id":"https://openalex.org/keywords/alias","display_name":"Alias","score":0.43752941489219666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43676891922950745},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.4134383201599121},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41289931535720825},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32305946946144104},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.23191341757774353},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.17334625124931335}],"concepts":[{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.8625068068504333},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.781241774559021},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6508780121803284},{"id":"https://openalex.org/C46681722","wikidata":"https://www.wikidata.org/wiki/Q4725589","display_name":"Alias","level":2,"score":0.43752941489219666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43676891922950745},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.4134383201599121},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41289931535720825},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32305946946144104},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.23191341757774353},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.17334625124931335}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3701716.3715212","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3701716.3715212","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3701716.3715212","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2502.02759","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.02759","pdf_url":"https://arxiv.org/pdf/2502.02759","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3701716.3715212","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3701716.3715212","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3701716.3715212","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion Proceedings of the ACM on Web Conference 2025","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407209053.pdf","grobid_xml":"https://content.openalex.org/works/W4407209053.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W9014458","https://openalex.org/W1237542396","https://openalex.org/W1587106557","https://openalex.org/W1981221397","https://openalex.org/W1985690171","https://openalex.org/W2010065958","https://openalex.org/W2289453476","https://openalex.org/W2514847810","https://openalex.org/W2574793465","https://openalex.org/W2586493909","https://openalex.org/W2625739732","https://openalex.org/W2743988610","https://openalex.org/W2900633536","https://openalex.org/W2981292756","https://openalex.org/W3023980642","https://openalex.org/W3178593045","https://openalex.org/W3206660056","https://openalex.org/W4213097531","https://openalex.org/W4296068317","https://openalex.org/W4385688627","https://openalex.org/W4392607820","https://openalex.org/W6702333882","https://openalex.org/W6944430949"],"related_works":["https://openalex.org/W4385605198","https://openalex.org/W2151266859","https://openalex.org/W2056017980","https://openalex.org/W2333004434","https://openalex.org/W4256550813","https://openalex.org/W4400966522","https://openalex.org/W1557487237","https://openalex.org/W4248617250","https://openalex.org/W275149381","https://openalex.org/W2997042634"],"abstract_inverted_index":{"Determining":[0],"the":[1,137,143],"family":[2,66,86,108],"to":[3,97,113],"which":[4],"a":[5,93,101],"malicious":[6,125],"file":[7],"belongs":[8],"is":[9,23],"an":[10,71],"essential":[11],"component":[12],"of":[13,60,79,103],"cyberattack":[14],"investigation,":[15],"attribution,":[16],"and":[17,26,69,117,130,145],"remediation.":[18],"Performing":[19],"this":[20],"task":[21],"manually":[22],"time":[24],"consuming":[25],"requires":[27],"expert":[28],"knowledge.":[29],"Automated":[30],"tools":[31,54],"using":[32,36],"that":[33],"label":[34],"malware":[35,85,115],"antivirus":[37,61,73,104],"detections":[38,99],"lack":[39],"accuracy":[40,135],"and/or":[41],"scalability,":[42],"making":[43],"them":[44],"insufficient":[45],"for":[46],"real-world":[47],"applications.":[48],"Three":[49],"pervasive":[50],"shortcomings":[51],"in":[52,141],"these":[53],"are":[55],"responsible:":[56],"(1)":[57],"incorrect":[58],"parsing":[59],"detections,":[62],"(2)":[63],"errors":[64],"during":[65],"alias":[67],"resolution,":[68],"(3)":[70],"inappropriate":[72],"aggregation":[74],"strategy.":[75],"To":[76],"address":[77],"each":[78],"these,":[80],"we":[81,118],"created":[82],"our":[83],"own":[84],"labeling":[87,122,142],"tool":[88,111,140],"called":[89],"ClarAVy.":[90],"ClarAVy":[91,127],"utilizes":[92],"Variational":[94],"Bayesian":[95],"approach":[96],"aggregate":[98],"from":[100],"collection":[102],"products":[105],"into":[106],"accurate":[107],"labels.":[109],"Our":[110],"scales":[112],"enormous":[114],"datasets,":[116,147],"evaluated":[119],"it":[120],"by":[121],"?40":[123],"million":[124],"files.":[126],"has":[128],"8":[129],"12":[131],"percentage":[132],"points":[133],"higher":[134],"than":[136],"prior":[138],"leading":[139],"MOTIF":[144],"MalPedia":[146],"respectively.":[148]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
