{"id":"https://openalex.org/W4415133278","doi":"https://doi.org/10.48550/arxiv.2506.02438","title":"A Review of Various Datasets for Machine Learning Algorithm-Based Intrusion Detection System: Advances and Challenges","display_name":"A Review of Various Datasets for Machine Learning Algorithm-Based Intrusion Detection System: Advances and Challenges","publication_year":2025,"publication_date":"2025-06-03","ids":{"openalex":"https://openalex.org/W4415133278","doi":"https://doi.org/10.48550/arxiv.2506.02438"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2506.02438","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.02438","pdf_url":"https://arxiv.org/pdf/2506.02438","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2506.02438","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028436957","display_name":"S. Tripathy","orcid":"https://orcid.org/0000-0002-6204-4258"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tripathy, Sudhanshu Sekhar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5109209815","display_name":"Biswajit Behera","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Behera, Bichitrananda","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9017000198364258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/intrusion-detection-system","display_name":"Intrusion detection system","score":0.7192000150680542},{"id":"https://openalex.org/keywords/confidentiality","display_name":"Confidentiality","score":0.5494999885559082},{"id":"https://openalex.org/keywords/network-security","display_name":"Network security","score":0.3937000036239624},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3903000056743622},{"id":"https://openalex.org/keywords/intrusion","display_name":"Intrusion","score":0.373199999332428},{"id":"https://openalex.org/keywords/globe","display_name":"Globe","score":0.2897000014781952}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7681000232696533},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.7275999784469604},{"id":"https://openalex.org/C35525427","wikidata":"https://www.wikidata.org/wiki/Q745881","display_name":"Intrusion detection system","level":2,"score":0.7192000150680542},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6700000166893005},{"id":"https://openalex.org/C71745522","wikidata":"https://www.wikidata.org/wiki/Q2476929","display_name":"Confidentiality","level":2,"score":0.5494999885559082},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.40149998664855957},{"id":"https://openalex.org/C182590292","wikidata":"https://www.wikidata.org/wiki/Q989632","display_name":"Network security","level":2,"score":0.3937000036239624},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3903000056743622},{"id":"https://openalex.org/C158251709","wikidata":"https://www.wikidata.org/wiki/Q354025","display_name":"Intrusion","level":2,"score":0.373199999332428},{"id":"https://openalex.org/C2775899829","wikidata":"https://www.wikidata.org/wiki/Q3109007","display_name":"Globe","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C527648132","wikidata":"https://www.wikidata.org/wiki/Q189900","display_name":"Information security","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C27061796","wikidata":"https://www.wikidata.org/wiki/Q745881","display_name":"Intrusion prevention system","level":3,"score":0.25999999046325684},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.25200000405311584},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2502000033855438}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2506.02438","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.02438","pdf_url":"https://arxiv.org/pdf/2506.02438","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2506.02438","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2506.02438","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2506.02438","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.02438","pdf_url":"https://arxiv.org/pdf/2506.02438","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415133278.pdf","grobid_xml":"https://content.openalex.org/works/W4415133278.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"IDS":[0,82,232],"aims":[1],"to":[2,16],"protect":[3,21],"computer":[4],"networks":[5,40],"from":[6],"security":[7,98],"threats":[8],"by":[9,83,102],"detecting,":[10],"notifying,":[11],"and":[12,20,32,39,55,72,116,122,137,162,169,189,204,221],"taking":[13],"appropriate":[14],"action":[15],"prevent":[17],"illegal":[18],"access":[19],"confidential":[22],"information.":[23],"As":[24],"the":[25,45,61,64,68,79,112,124,149,199,202,212],"globe":[26],"becomes":[27],"increasingly":[28],"dependent":[29],"on":[30,133,153],"technology":[31,57],"automated":[33],"processes,":[34],"ensuring":[35],"secured":[36],"systems,":[37],"applications,":[38],"has":[41,145],"become":[42],"one":[43],"of":[44,49,63,70,81,114,131,174,195,201],"most":[46],"significant":[47],"problems":[48],"this":[50],"era.":[51],"The":[52],"global":[53],"web":[54],"digital":[56],"have":[58],"significantly":[59],"accelerated":[60],"evolution":[62],"modern":[65],"world,":[66],"necessitating":[67],"use":[69,180],"telecommunications":[71],"data":[73],"transfer":[74],"platforms.":[75],"Researchers":[76],"are":[77],"enhancing":[78],"effectiveness":[80],"incorporating":[84],"popular":[85],"datasets":[86,127,213],"into":[87],"machine":[88,94,134],"learning":[89,95,135,139],"algorithms.":[90],"IDS,":[91],"equipped":[92],"with":[93],"classifiers,":[96],"enhances":[97],"attack":[99],"detection":[100,119,143,177],"accuracy":[101],"identifying":[103],"normal":[104],"or":[105],"abnormal":[106],"network":[107],"traffic.":[108],"This":[109,224],"paper":[110],"explores":[111],"methods":[113,178],"capturing":[115],"reviewing":[117],"intrusion":[118,142,176],"systems":[120],"(IDS)":[121],"evaluates":[123],"challenges":[125],"existing":[126],"face.":[128],"A":[129,207],"deluge":[130],"research":[132],"(ML)":[136],"deep":[138],"(DL)":[140],"architecture-based":[141],"techniques":[144],"been":[146],"conducted":[147,165],"in":[148],"past":[150],"ten":[151],"years":[152],"various":[154,175],"cybersecurity":[155],"datasets,":[156],"including":[157],"KDDCUP'99,":[158],"NSL-KDD,":[159],"UNSW-NB15,":[160],"CICIDS-2017,":[161],"CSE-CIC-IDS2018.":[163],"We":[164,191],"a":[166,227],"literature":[167],"review":[168,229],"presented":[170],"an":[171,193],"in-depth":[172],"analysis":[173,210],"that":[179],"SVM,":[181],"KNN,":[182],"DT,":[183],"LR,":[184],"NB,":[185],"RF,":[186],"XGBOOST,":[187],"Adaboost,":[188],"ANN.":[190],"provide":[192],"overview":[194],"each":[196],"technique,":[197],"explaining":[198],"role":[200],"classifiers":[203,215],"algorithms":[205],"used.":[206],"detailed":[208],"tabular":[209],"highlights":[211],"used,":[214],"employed,":[216],"attacks":[217],"detected,":[218],"evaluation":[219],"metrics,":[220],"conclusions":[222],"drawn.":[223],"article":[225],"offers":[226],"thorough":[228],"for":[230],"future":[231],"research.":[233]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-14T00:00:00"}
