{"id":"https://openalex.org/W1971384109","doi":"https://doi.org/10.1109/bigdata.2014.7004290","title":"Hierarchical management of large-scale malware data","display_name":"Hierarchical management of large-scale malware data","publication_year":2014,"publication_date":"2014-10-01","ids":{"openalex":"https://openalex.org/W1971384109","doi":"https://doi.org/10.1109/bigdata.2014.7004290","mag":"1971384109"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2014.7004290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2014.7004290","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061636802","display_name":"Lee Kellogg","orcid":null},"institutions":[{"id":"https://openalex.org/I137381566","display_name":"Charles River Laboratories (Netherlands)","ror":"https://ror.org/01tasya06","country_code":"NL","type":"company","lineage":["https://openalex.org/I137381566","https://openalex.org/I4210126295"]},{"id":"https://openalex.org/I4210149760","display_name":"Charles River Analytics (United States)","ror":"https://ror.org/03z47zw42","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149760"]}],"countries":["NL","US"],"is_corresponding":false,"raw_author_name":"Lee Kellogg","raw_affiliation_strings":["Charles River Analytics, Cambridge, MA","Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles River Analytics, Cambridge, MA","institution_ids":["https://openalex.org/I4210149760"]},{"raw_affiliation_string":"Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138","institution_ids":["https://openalex.org/I137381566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108256840","display_name":"Brian Ruttenberg","orcid":null},"institutions":[{"id":"https://openalex.org/I137381566","display_name":"Charles River Laboratories (Netherlands)","ror":"https://ror.org/01tasya06","country_code":"NL","type":"company","lineage":["https://openalex.org/I137381566","https://openalex.org/I4210126295"]},{"id":"https://openalex.org/I4210149760","display_name":"Charles River Analytics (United States)","ror":"https://ror.org/03z47zw42","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149760"]}],"countries":["NL","US"],"is_corresponding":false,"raw_author_name":"Brian Ruttenberg","raw_affiliation_strings":["Charles River Analytics, Cambridge, MA","Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles River Analytics, Cambridge, MA","institution_ids":["https://openalex.org/I4210149760"]},{"raw_affiliation_string":"Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138","institution_ids":["https://openalex.org/I137381566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072586846","display_name":"Alison O'Connor","orcid":null},"institutions":[{"id":"https://openalex.org/I137381566","display_name":"Charles River Laboratories (Netherlands)","ror":"https://ror.org/01tasya06","country_code":"NL","type":"company","lineage":["https://openalex.org/I137381566","https://openalex.org/I4210126295"]},{"id":"https://openalex.org/I4210149760","display_name":"Charles River Analytics (United States)","ror":"https://ror.org/03z47zw42","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149760"]}],"countries":["NL","US"],"is_corresponding":false,"raw_author_name":"Alison O'Connor","raw_affiliation_strings":["Charles River Analytics, Cambridge, MA","Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles River Analytics, Cambridge, MA","institution_ids":["https://openalex.org/I4210149760"]},{"raw_affiliation_string":"Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138","institution_ids":["https://openalex.org/I137381566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109448799","display_name":"Michael Howard","orcid":null},"institutions":[{"id":"https://openalex.org/I137381566","display_name":"Charles River Laboratories (Netherlands)","ror":"https://ror.org/01tasya06","country_code":"NL","type":"company","lineage":["https://openalex.org/I137381566","https://openalex.org/I4210126295"]},{"id":"https://openalex.org/I4210149760","display_name":"Charles River Analytics (United States)","ror":"https://ror.org/03z47zw42","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149760"]}],"countries":["NL","US"],"is_corresponding":false,"raw_author_name":"Michael Howard","raw_affiliation_strings":["Charles River Analytics, Cambridge, MA","Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles River Analytics, Cambridge, MA","institution_ids":["https://openalex.org/I4210149760"]},{"raw_affiliation_string":"Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138","institution_ids":["https://openalex.org/I137381566"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054178937","display_name":"Avi Pfeffer","orcid":"https://orcid.org/0000-0002-6724-2640"},"institutions":[{"id":"https://openalex.org/I137381566","display_name":"Charles River Laboratories (Netherlands)","ror":"https://ror.org/01tasya06","country_code":"NL","type":"company","lineage":["https://openalex.org/I137381566","https://openalex.org/I4210126295"]},{"id":"https://openalex.org/I4210149760","display_name":"Charles River Analytics (United States)","ror":"https://ror.org/03z47zw42","country_code":"US","type":"company","lineage":["https://openalex.org/I4210149760"]}],"countries":["NL","US"],"is_corresponding":false,"raw_author_name":"Avi Pfeffer","raw_affiliation_strings":["Charles River Analytics, Cambridge, MA","Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Charles River Analytics, Cambridge, MA","institution_ids":["https://openalex.org/I4210149760"]},{"raw_affiliation_string":"Charles River Analytics 625 Mt. Auburn St, Cambridge, MA, 02138","institution_ids":["https://openalex.org/I137381566"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2949,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.52737028,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"4","issue":null,"first_page":"666","last_page":"674"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.9442113637924194},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8120559453964233},{"id":"https://openalex.org/keywords/malware-analysis","display_name":"Malware analysis","score":0.7579286098480225},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7432597279548645},{"id":"https://openalex.org/keywords/cryptovirology","display_name":"Cryptovirology","score":0.5258474946022034},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.514272153377533},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.46122246980667114},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.43604058027267456},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.4161871075630188},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.27116385102272034},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.2106124758720398}],"concepts":[{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.9442113637924194},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8120559453964233},{"id":"https://openalex.org/C2779395397","wikidata":"https://www.wikidata.org/wiki/Q15731404","display_name":"Malware analysis","level":3,"score":0.7579286098480225},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7432597279548645},{"id":"https://openalex.org/C84525096","wikidata":"https://www.wikidata.org/wiki/Q3506050","display_name":"Cryptovirology","level":3,"score":0.5258474946022034},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.514272153377533},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.46122246980667114},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.43604058027267456},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.4161871075630188},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27116385102272034},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2106124758720398},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2014.7004290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2014.7004290","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332467","display_name":"U.S. Air Force","ror":"https://ror.org/006gmme17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W107173025","https://openalex.org/W154046626","https://openalex.org/W582454943","https://openalex.org/W1910686388","https://openalex.org/W1979400615","https://openalex.org/W1992110042","https://openalex.org/W1998081459","https://openalex.org/W2008324060","https://openalex.org/W2039346806","https://openalex.org/W2068224601","https://openalex.org/W2073308541","https://openalex.org/W2095351408","https://openalex.org/W2097706568","https://openalex.org/W2123402141","https://openalex.org/W2131681506","https://openalex.org/W2132069633","https://openalex.org/W2143306733","https://openalex.org/W2145056020","https://openalex.org/W2147717514","https://openalex.org/W2397770138","https://openalex.org/W2503400061","https://openalex.org/W3099768174","https://openalex.org/W4234536190","https://openalex.org/W6604386673","https://openalex.org/W6639864006","https://openalex.org/W6674647444","https://openalex.org/W6674657515","https://openalex.org/W6924999623"],"related_works":["https://openalex.org/W2469507153","https://openalex.org/W2008790809","https://openalex.org/W2768892939","https://openalex.org/W2160963033","https://openalex.org/W3022706011","https://openalex.org/W2909615516","https://openalex.org/W2249256574","https://openalex.org/W2397240470","https://openalex.org/W3128265165","https://openalex.org/W4210907385"],"abstract_inverted_index":{"As":[0],"the":[1,56,68,110,113,119,157],"pace":[2],"of":[3,5,43,48,55,67,77,112,121,133],"generation":[4],"new":[6,16,78],"malware":[7,14,29,35,60,79,94,135,146,159],"accelerates,":[8],"clustering":[9,85,103,137],"and":[10,33,39,72,139,148,153],"classifying":[11],"newly":[12],"discovered":[13],"requires":[15],"approaches":[17],"to":[18,27,30,97,127,150],"data":[19,114,130],"management.":[20],"We":[21,116],"describe":[22],"our":[23,49,91,122],"Big":[24],"Data":[25],"approach":[26,50,143],"managing":[28],"support":[31],"effective":[32],"efficient":[34,74],"analysis":[36,76],"on":[37],"large":[38],"rapidly":[40],"evolving":[41],"sets":[42],"malware.":[44],"The":[45],"key":[46],"element":[47],"is":[51],"a":[52,64],"hierarchical":[53,102],"organization":[54],"malware,":[57,71],"which":[58],"organizes":[59],"into":[61],"families,":[62],"maintains":[63],"rich":[65],"description":[66],"relationships":[69],"between":[70],"facilitates":[73],"online":[75],"as":[80,124],"they":[81],"are":[82],"discovered.":[83],"Using":[84],"evaluation":[86],"metrics,":[87],"we":[88],"show":[89,118],"that":[90],"system":[92,123],"discovers":[93],"families":[95],"comparable":[96],"those":[98],"produced":[99],"by":[100],"traditional":[101],"algorithms,":[104,138],"while":[105],"scaling":[106],"much":[107],"better":[108],"with":[109],"size":[111],"set.":[115],"also":[117],"flexibility":[120],"it":[125],"relates":[126],"substituting":[128],"various":[129],"representations,":[131],"methods":[132],"comparing":[134],"binaries,":[136],"other":[140],"factors.":[141],"Our":[142],"will":[144],"enable":[145],"analysts":[147],"investigators":[149],"quickly":[151],"understand":[152],"quantify":[154],"changes":[155],"in":[156],"global":[158],"ecosystem.":[160]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
