{"id":"https://openalex.org/W3157816830","doi":"https://doi.org/10.1109/ciss50987.2021.9400219","title":"Malware Subspecies Detection Method by Suffix Arrays and Machine Learning","display_name":"Malware Subspecies Detection Method by Suffix Arrays and Machine Learning","publication_year":2021,"publication_date":"2021-03-24","ids":{"openalex":"https://openalex.org/W3157816830","doi":"https://doi.org/10.1109/ciss50987.2021.9400219","mag":"3157816830"},"language":"en","primary_location":{"id":"doi:10.1109/ciss50987.2021.9400219","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss50987.2021.9400219","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 55th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053344614","display_name":"K Kita","orcid":null},"institutions":[{"id":"https://openalex.org/I148798404","display_name":"Tokyo University of Technology","ror":"https://ror.org/021a26605","country_code":"JP","type":"education","lineage":["https://openalex.org/I148798404"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kouhei Kita","raw_affiliation_strings":["School of Computer Science, Tokyo University of Technology, Hachioji, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, Tokyo University of Technology, Hachioji, Tokyo, Japan","institution_ids":["https://openalex.org/I148798404"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108726661","display_name":"Ryuya Uda","orcid":null},"institutions":[{"id":"https://openalex.org/I148798404","display_name":"Tokyo University of Technology","ror":"https://ror.org/021a26605","country_code":"JP","type":"education","lineage":["https://openalex.org/I148798404"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ryuya Uda","raw_affiliation_strings":["School of Computer Science, Tokyo University of Technology, Hachioji, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, Tokyo University of Technology, Hachioji, Tokyo, Japan","institution_ids":["https://openalex.org/I148798404"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6177,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.65669144,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.97079998254776,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/malware","display_name":"Malware","score":0.9064587354660034},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7861771583557129},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5510200262069702},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5495606064796448},{"id":"https://openalex.org/keywords/suffix","display_name":"Suffix","score":0.5218226313591003},{"id":"https://openalex.org/keywords/suffix-tree","display_name":"Suffix tree","score":0.4991023540496826},{"id":"https://openalex.org/keywords/static-analysis","display_name":"Static analysis","score":0.45393502712249756},{"id":"https://openalex.org/keywords/subspecies","display_name":"Subspecies","score":0.4529421031475067},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4209354519844055},{"id":"https://openalex.org/keywords/system-call","display_name":"System call","score":0.41191715002059937},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36828213930130005},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3569587469100952},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.21255746483802795},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.16569840908050537},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.14741092920303345},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.13639986515045166},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11578673124313354}],"concepts":[{"id":"https://openalex.org/C541664917","wikidata":"https://www.wikidata.org/wiki/Q14001","display_name":"Malware","level":2,"score":0.9064587354660034},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7861771583557129},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5510200262069702},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5495606064796448},{"id":"https://openalex.org/C2779804580","wikidata":"https://www.wikidata.org/wiki/Q102047","display_name":"Suffix","level":2,"score":0.5218226313591003},{"id":"https://openalex.org/C2781166958","wikidata":"https://www.wikidata.org/wiki/Q1426863","display_name":"Suffix tree","level":3,"score":0.4991023540496826},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.45393502712249756},{"id":"https://openalex.org/C17966761","wikidata":"https://www.wikidata.org/wiki/Q68947","display_name":"Subspecies","level":2,"score":0.4529421031475067},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4209354519844055},{"id":"https://openalex.org/C2778579508","wikidata":"https://www.wikidata.org/wiki/Q722192","display_name":"System call","level":2,"score":0.41191715002059937},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36828213930130005},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3569587469100952},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.21255746483802795},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.16569840908050537},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.14741092920303345},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.13639986515045166},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11578673124313354},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ciss50987.2021.9400219","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ciss50987.2021.9400219","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 55th Annual Conference on Information Sciences and Systems (CISS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6664433454","display_name":null,"funder_award_id":"JP18K11248","funder_id":"https://openalex.org/F4320320212","funder_display_name":"Japan Society for the Promotion of Science London"}],"funders":[{"id":"https://openalex.org/F4320320212","display_name":"Japan Society for the Promotion of Science London","ror":"https://ror.org/02m7axw05"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W192227941","https://openalex.org/W1558357780","https://openalex.org/W2121749752","https://openalex.org/W2144112223","https://openalex.org/W2153616611","https://openalex.org/W2301473744","https://openalex.org/W2325770265","https://openalex.org/W2444115772","https://openalex.org/W2518866423","https://openalex.org/W2712617220","https://openalex.org/W2744520801","https://openalex.org/W2789326120","https://openalex.org/W2792663539","https://openalex.org/W2894779647","https://openalex.org/W2965339432","https://openalex.org/W2968493742","https://openalex.org/W4394654479","https://openalex.org/W6633418244","https://openalex.org/W6678051712","https://openalex.org/W6745796943","https://openalex.org/W6766563997"],"related_works":["https://openalex.org/W3033292598","https://openalex.org/W2968586400","https://openalex.org/W1827256152","https://openalex.org/W2765174411","https://openalex.org/W3113361848","https://openalex.org/W2325770265","https://openalex.org/W1534710991","https://openalex.org/W2803049783","https://openalex.org/W2301473744","https://openalex.org/W3157816830"],"abstract_inverted_index":{"Malware":[0],"such":[1],"as":[2],"metamorphic":[3],"virus":[4],"changes":[5],"its":[6],"codes":[7],"and":[8,124,137],"it":[9],"cannot":[10],"be":[11,19,103],"detected":[12,20],"by":[13,21,65,121],"pattern":[14],"matching.":[15],"Such":[16],"malware":[17,79,101,117,134],"can":[18,102],"surface":[22,32,48],"analysis,":[23],"dynamic":[24],"analysis":[25,33,49],"or":[26],"static":[27],"analysis.":[28],"We":[29,127],"focused":[30],"on":[31],"since":[34,67],"neither":[35],"virtual":[36],"environments":[37],"nor":[38],"high":[39],"level":[40],"engineering":[41],"is":[42,50,69],"required.":[43],"A":[44],"representative":[45],"method":[46,120,130],"in":[47,72,96],"n-gram":[51,66,87,98],"with":[52,131,142],"machine":[53,125],"learning.":[54,126],"On":[55],"the":[56,106,129],"other":[57],"hand,":[58],"important":[59],"features":[60,88],"are":[61,82,108],"sometimes":[62],"cut":[63],"off":[64],"n":[68],"not":[70,83],"variable":[71],"some":[73,97],"existing":[74],"methods.":[75],"Hence,":[76],"scores":[77],"of":[78],"detection":[80,119],"methods":[81,107],"perfect.":[84],"Moreover,":[85],"creating":[86],"takes":[89],"long":[90],"time":[91],"for":[92],"comparing":[93],"files.":[94],"Furthermore,":[95],"methods,":[99],"invisible":[100],"created":[104],"when":[105],"known":[109],"to":[110,139],"attackers.":[111],"Therefore,":[112],"we":[113],"proposed":[114],"a":[115],"new":[116],"subspecies":[118,135],"suffix":[122],"arrays":[123],"evaluated":[128],"four":[132],"real":[133],"families":[136],"succeeded":[138],"classify":[140],"them":[141],"almost":[143],"100%":[144],"accuracy.":[145]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
