{"id":"https://openalex.org/W3046419603","doi":"https://doi.org/10.3390/make2030012","title":"Hierarchy-Based File Fragment Classification","display_name":"Hierarchy-Based File Fragment Classification","publication_year":2020,"publication_date":"2020-08-03","ids":{"openalex":"https://openalex.org/W3046419603","doi":"https://doi.org/10.3390/make2030012","mag":"3046419603"},"language":"en","primary_location":{"id":"doi:10.3390/make2030012","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make2030012","pdf_url":"https://www.mdpi.com/2504-4990/2/3/12/pdf?version=1596457979","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-4990/2/3/12/pdf?version=1596457979","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112988008","display_name":"Manish Bhatt","orcid":"https://orcid.org/0000-0002-3867-5180"},"institutions":[{"id":"https://openalex.org/I192396691","display_name":"University of New Orleans","ror":"https://ror.org/034mtvk83","country_code":"US","type":"education","lineage":["https://openalex.org/I192396691","https://openalex.org/I2799628689"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Manish Bhatt","raw_affiliation_strings":["Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA","institution_ids":["https://openalex.org/I192396691"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000961605","display_name":"Avdesh Mishra","orcid":"https://orcid.org/0000-0001-9666-8715"},"institutions":[{"id":"https://openalex.org/I181414168","display_name":"Texas A&M University \u2013 Kingsville","ror":"https://ror.org/05abs3w97","country_code":"US","type":"education","lineage":["https://openalex.org/I181414168"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Avdesh Mishra","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Texas A&amp;M University-Kingsville, Kingsville, TX 78363, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Texas A&amp;M University-Kingsville, Kingsville, TX 78363, USA","institution_ids":["https://openalex.org/I181414168"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057315913","display_name":"Md Wasi Ul Kabir","orcid":null},"institutions":[{"id":"https://openalex.org/I192396691","display_name":"University of New Orleans","ror":"https://ror.org/034mtvk83","country_code":"US","type":"education","lineage":["https://openalex.org/I192396691","https://openalex.org/I2799628689"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Md Wasi Ul Kabir","raw_affiliation_strings":["Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA","institution_ids":["https://openalex.org/I192396691"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019653582","display_name":"S. E. Blake-Gatto","orcid":null},"institutions":[{"id":"https://openalex.org/I192396691","display_name":"University of New Orleans","ror":"https://ror.org/034mtvk83","country_code":"US","type":"education","lineage":["https://openalex.org/I192396691","https://openalex.org/I2799628689"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"S. E. Blake-Gatto","raw_affiliation_strings":["Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA","institution_ids":["https://openalex.org/I192396691"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053958975","display_name":"Rishav Rajendra","orcid":null},"institutions":[{"id":"https://openalex.org/I192396691","display_name":"University of New Orleans","ror":"https://ror.org/034mtvk83","country_code":"US","type":"education","lineage":["https://openalex.org/I192396691","https://openalex.org/I2799628689"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rishav Rajendra","raw_affiliation_strings":["Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA","institution_ids":["https://openalex.org/I192396691"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055092646","display_name":"Md Tamjidul Hoque","orcid":"https://orcid.org/0000-0002-0110-2194"},"institutions":[{"id":"https://openalex.org/I192396691","display_name":"University of New Orleans","ror":"https://ror.org/034mtvk83","country_code":"US","type":"education","lineage":["https://openalex.org/I192396691","https://openalex.org/I2799628689"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Md Tamjidul Hoque","raw_affiliation_strings":["Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA"],"raw_orcid":"https://orcid.org/0000-0002-0110-2194","affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of New Orleans, 2000 Lakeshore Dr., New Orleans, LA 70148, USA","institution_ids":["https://openalex.org/I192396691"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063509441","display_name":"Irfan Ahmed","orcid":"https://orcid.org/0000-0001-5648-388X"},"institutions":[{"id":"https://openalex.org/I184840846","display_name":"Virginia Commonwealth University","ror":"https://ror.org/02nkdxk79","country_code":"US","type":"education","lineage":["https://openalex.org/I184840846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Irfan Ahmed","raw_affiliation_strings":["Department of Computer Science, Virginia Commonwealth University, Richmond, VA 23284, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Virginia Commonwealth University, Richmond, VA 23284, USA","institution_ids":["https://openalex.org/I184840846"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5055092646"],"corresponding_institution_ids":["https://openalex.org/I192396691"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":2.5056,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.91627898,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"2","issue":"3","first_page":"216","last_page":"232"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12034","display_name":"Digital and Cyber Forensics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8134608268737793},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.6636985540390015},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6249149441719055},{"id":"https://openalex.org/keywords/byte","display_name":"Byte","score":0.5218828320503235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5000629425048828},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.4779660403728485},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.4736779034137726},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.458626925945282},{"id":"https://openalex.org/keywords/fragment","display_name":"Fragment (logic)","score":0.4155043959617615},{"id":"https://openalex.org/keywords/file-format","display_name":"File format","score":0.41480717062950134},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40450263023376465},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3383789658546448},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.23567861318588257},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1076059639453888},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10127297043800354},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09574541449546814}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8134608268737793},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.6636985540390015},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6249149441719055},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.5218828320503235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5000629425048828},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.4779660403728485},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.4736779034137726},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.458626925945282},{"id":"https://openalex.org/C2776235265","wikidata":"https://www.wikidata.org/wiki/Q18392052","display_name":"Fragment (logic)","level":2,"score":0.4155043959617615},{"id":"https://openalex.org/C97250363","wikidata":"https://www.wikidata.org/wiki/Q235557","display_name":"File format","level":2,"score":0.41480717062950134},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40450263023376465},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3383789658546448},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.23567861318588257},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1076059639453888},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10127297043800354},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09574541449546814},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/make2030012","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make2030012","pdf_url":"https://www.mdpi.com/2504-4990/2/3/12/pdf?version=1596457979","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:6122b7c51b0c4577a636b3b51fef8176","is_oa":true,"landing_page_url":"https://doaj.org/article/6122b7c51b0c4577a636b3b51fef8176","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning and Knowledge Extraction, Vol 2, Iss 3, Pp 216-232 (2020)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2504-4990/2/3/12/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/make2030012","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning and Knowledge Extraction; Volume 2; Issue 3; Pages: 216-232","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/make2030012","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make2030012","pdf_url":"https://www.mdpi.com/2504-4990/2/3/12/pdf?version=1596457979","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G332855101","display_name":null,"funder_award_id":"NSF grant # 1623276","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4798353591","display_name":null,"funder_award_id":"Board of Regents Support Fund LEQSF (2016-19)-RD-B-07","funder_id":"https://openalex.org/F4320309392","funder_display_name":"Louisiana Board of Regents"},{"id":"https://openalex.org/G6965536007","display_name":null,"funder_award_id":"1623276","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309392","display_name":"Louisiana Board of Regents","ror":"https://ror.org/00jv89z46"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3046419603.pdf","grobid_xml":"https://content.openalex.org/works/W3046419603.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W77540285","https://openalex.org/W985774724","https://openalex.org/W1553407966","https://openalex.org/W1746799182","https://openalex.org/W1995875735","https://openalex.org/W2001762414","https://openalex.org/W2008835805","https://openalex.org/W2027166822","https://openalex.org/W2031685798","https://openalex.org/W2049050234","https://openalex.org/W2063862666","https://openalex.org/W2071484336","https://openalex.org/W2076342816","https://openalex.org/W2101347959","https://openalex.org/W2116773818","https://openalex.org/W2117991511","https://openalex.org/W2120932128","https://openalex.org/W2122956713","https://openalex.org/W2125371264","https://openalex.org/W2137833784","https://openalex.org/W2151554678","https://openalex.org/W2151958475","https://openalex.org/W2153635072","https://openalex.org/W2156909104","https://openalex.org/W2157888595","https://openalex.org/W2161406213","https://openalex.org/W2519674279","https://openalex.org/W2735332739","https://openalex.org/W2796263526","https://openalex.org/W2887831059","https://openalex.org/W2983181739","https://openalex.org/W3036399259","https://openalex.org/W4237490343","https://openalex.org/W4298236029","https://openalex.org/W6677731448","https://openalex.org/W6679033275"],"related_works":["https://openalex.org/W1973480752","https://openalex.org/W2805502594","https://openalex.org/W4253208712","https://openalex.org/W3132641048","https://openalex.org/W2217679042","https://openalex.org/W1603677234","https://openalex.org/W2525971763","https://openalex.org/W2984753899","https://openalex.org/W2783178962","https://openalex.org/W1896179566"],"abstract_inverted_index":{"File":[0],"fragment":[1,49],"classification":[2],"is":[3],"an":[4,135,141,159],"essential":[5],"problem":[6],"in":[7,161],"digital":[8],"forensics.":[9],"Although":[10],"several":[11],"attempts":[12],"had":[13],"been":[14,26],"made":[15],"to":[16,87,130],"solve":[17],"this":[18,29],"challenging":[19],"problem,":[20],"a":[21,33,77,96,114],"general":[22,56],"solution":[23],"has":[24],"not":[25],"found.":[27],"In":[28],"work,":[30],"we":[31,167],"propose":[32,76],"hierarchical":[34,89],"machine-learning-based":[35],"approach":[36,52],"with":[37,95,102,134,158],"optimized":[38],"support":[39],"vector":[40],"machines":[41],"(SVM)":[42],"as":[43],"the":[44,59,68,72,117,122,131,152,162,175,179],"base":[45],"classifiers":[46,57,66],"for":[47,80],"file":[48,81,100,110],"classification.":[50,90],"This":[51],"consists":[53],"of":[54,71,98,116,138,143,164,181],"more":[55,63],"at":[58,67],"top":[60],"level":[61],"and":[62,140,154,171],"specialized":[64],"fine-grain":[65],"lower":[69],"levels":[70],"hierarchy.":[73],"We":[74,91,148],"also":[75],"primitive":[78],"taxonomy":[79],"types":[82],"that":[83],"can":[84],"be":[85],"used":[86],"perform":[88],"evaluate":[92],"our":[93,169],"model":[94],"dataset":[97],"14":[99],"types,":[101],"1000":[103],"fragments":[104],"measuring":[105],"512":[106],"bytes":[107],"from":[108,113],"each":[109],"type":[111],"derived":[112],"subset":[115],"publicly":[118],"available":[119],"Digital":[120],"Corpora,":[121],"govdocs1":[123],"corpus.":[124],"Our":[125],"experiment":[126],"shows":[127],"comparable":[128],"results":[129],"present":[132],"literature,":[133],"average":[136],"accuracy":[137],"67.78%":[139],"F1-measure":[142,163],"65%":[144],"using":[145],"10-fold":[146],"cross-validation.":[147],"then":[149,173],"improve":[150],"on":[151],"hierarchy":[153],"find":[155],"better":[156],"results,":[157],"increase":[160],"1%.":[165],"Finally,":[166],"make":[168],"assessment":[170],"observations,":[172],"conclude":[174],"paper":[176],"by":[177],"discussing":[178],"scope":[180],"future":[182],"research.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2020-08-07T00:00:00"}
