{"id":"https://openalex.org/W7131651366","doi":"https://doi.org/10.1007/s10207-026-01235-z","title":"Toward AI-driven IoT cybersecurity: A preprocessing framework for benchmark datasets","display_name":"Toward AI-driven IoT cybersecurity: A preprocessing framework for benchmark datasets","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131651366","doi":"https://doi.org/10.1007/s10207-026-01235-z"},"language":"en","primary_location":{"id":"doi:10.1007/s10207-026-01235-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10207-026-01235-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10207-026-01235-z.pdf","source":{"id":"https://openalex.org/S164062316","display_name":"International Journal of Information Security","issn_l":"1615-5262","issn":["1615-5262","1615-5270"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Information Security","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10207-026-01235-z.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123178155","display_name":"Virginia Martinez-Fuentes","orcid":null},"institutions":[{"id":"https://openalex.org/I46176106","display_name":"Universidad de Burgos","ror":"https://ror.org/049da5t36","country_code":"ES","type":"education","lineage":["https://openalex.org/I46176106"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Virginia Martinez-Fuentes","raw_affiliation_strings":["Applied Computational Intelligence Group (GICAP), Burgos, Spain","Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain"],"raw_orcid":"https://orcid.org/0009-0007-7493-4059","affiliations":[{"raw_affiliation_string":"Applied Computational Intelligence Group (GICAP), Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]},{"raw_affiliation_string":"Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123190883","display_name":"Angel Arroyo","orcid":null},"institutions":[{"id":"https://openalex.org/I46176106","display_name":"Universidad de Burgos","ror":"https://ror.org/049da5t36","country_code":"ES","type":"education","lineage":["https://openalex.org/I46176106"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Angel Arroyo","raw_affiliation_strings":["Applied Computational Intelligence Group (GICAP), Burgos, Spain","Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain"],"raw_orcid":"https://orcid.org/0000-0002-1614-9075","affiliations":[{"raw_affiliation_string":"Applied Computational Intelligence Group (GICAP), Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]},{"raw_affiliation_string":"Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037060212","display_name":"Diego Granados L\u00f3pez","orcid":null},"institutions":[{"id":"https://openalex.org/I4210103453","display_name":"Swift Solar (United States)","ror":"https://ror.org/0191qaw76","country_code":"US","type":"company","lineage":["https://openalex.org/I4210103453"]},{"id":"https://openalex.org/I46176106","display_name":"Universidad de Burgos","ror":"https://ror.org/049da5t36","country_code":"ES","type":"education","lineage":["https://openalex.org/I46176106"]}],"countries":["ES","US"],"is_corresponding":false,"raw_author_name":"Diego Granados L\u00f3pez","raw_affiliation_strings":["Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain","Solar and Wind Feasibility Technologies (SWIFT), Burgos, Spain"],"raw_orcid":"https://orcid.org/0000-0002-9046-7397","affiliations":[{"raw_affiliation_string":"Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]},{"raw_affiliation_string":"Solar and Wind Feasibility Technologies (SWIFT), Burgos, Spain","institution_ids":["https://openalex.org/I4210103453"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123211155","display_name":"Alvaro Herrero","orcid":null},"institutions":[{"id":"https://openalex.org/I46176106","display_name":"Universidad de Burgos","ror":"https://ror.org/049da5t36","country_code":"ES","type":"education","lineage":["https://openalex.org/I46176106"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Alvaro Herrero","raw_affiliation_strings":["Applied Computational Intelligence Group (GICAP), Burgos, Spain","Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain"],"raw_orcid":"https://orcid.org/0000-0002-2444-5384","affiliations":[{"raw_affiliation_string":"Applied Computational Intelligence Group (GICAP), Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]},{"raw_affiliation_string":"Department of Digitalization School of Engineering (Escuela Polit\u00e9cnica Superior), University of Burgos (Universidad de Burgos), Avda. Cantabria s/n, 09006, Burgos, Spain","institution_ids":["https://openalex.org/I46176106"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5123178155"],"corresponding_institution_ids":["https://openalex.org/I46176106"],"apc_list":{"value":2590,"currency":"EUR","value_usd":3190},"apc_paid":{"value":2590,"currency":"EUR","value_usd":3190},"fwci":21.2565,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.98731537,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"25","issue":"2","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.14959999918937683,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.14959999918937683,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.11739999800920486,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.043800000101327896,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.7426999807357788},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.7117999792098999},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.703499972820282},{"id":"https://openalex.org/keywords/data-pre-processing","display_name":"Data pre-processing","score":0.5740000009536743},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5679000020027161},{"id":"https://openalex.org/keywords/upsampling","display_name":"Upsampling","score":0.5273000001907349},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4932999908924103},{"id":"https://openalex.org/keywords/internet-of-things","display_name":"Internet of Things","score":0.44510000944137573}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8623999953269958},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.7426999807357788},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.7117999792098999},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.703499972820282},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5860999822616577},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5841000080108643},{"id":"https://openalex.org/C10551718","wikidata":"https://www.wikidata.org/wiki/Q5227332","display_name":"Data pre-processing","level":2,"score":0.5740000009536743},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5679000020027161},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5428000092506409},{"id":"https://openalex.org/C110384440","wikidata":"https://www.wikidata.org/wiki/Q1143270","display_name":"Upsampling","level":3,"score":0.5273000001907349},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4932999908924103},{"id":"https://openalex.org/C81860439","wikidata":"https://www.wikidata.org/wiki/Q251212","display_name":"Internet of Things","level":2,"score":0.44510000944137573},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4406000077724457},{"id":"https://openalex.org/C120894424","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory data analysis","level":2,"score":0.38850000500679016},{"id":"https://openalex.org/C3018260909","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory analysis","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.33980000019073486},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3359000086784363},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.32519999146461487},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.25600001215934753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10207-026-01235-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10207-026-01235-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10207-026-01235-z.pdf","source":{"id":"https://openalex.org/S164062316","display_name":"International Journal of Information Security","issn_l":"1615-5262","issn":["1615-5262","1615-5270"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Information Security","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10207-026-01235-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10207-026-01235-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10207-026-01235-z.pdf","source":{"id":"https://openalex.org/S164062316","display_name":"International Journal of Information Security","issn_l":"1615-5262","issn":["1615-5262","1615-5270"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Information Security","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4641926116","display_name":null,"funder_award_id":"C032.23","funder_id":"https://openalex.org/F4320327970","funder_display_name":"Instituto Nacional de Ciberseguridad"},{"id":"https://openalex.org/G8808062000","display_name":null,"funder_award_id":"COVID19","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320319138","display_name":"Universidad de Burgos","ror":"https://ror.org/049da5t36"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320327970","display_name":"Instituto Nacional de Ciberseguridad","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7131651366.pdf","grobid_xml":"https://content.openalex.org/works/W7131651366.grobid-xml"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W2892556724","https://openalex.org/W2948211051","https://openalex.org/W2952298682","https://openalex.org/W2955014922","https://openalex.org/W2958285686","https://openalex.org/W2974232099","https://openalex.org/W2986458967","https://openalex.org/W3085955590","https://openalex.org/W3093621053","https://openalex.org/W3102359135","https://openalex.org/W3118198986","https://openalex.org/W3129369183","https://openalex.org/W3133060356","https://openalex.org/W3152804902","https://openalex.org/W3162956350","https://openalex.org/W3164796711","https://openalex.org/W3164964481","https://openalex.org/W3185349529","https://openalex.org/W3197995211","https://openalex.org/W4205887123","https://openalex.org/W4212986808","https://openalex.org/W4220685868","https://openalex.org/W4226319939","https://openalex.org/W4293812121","https://openalex.org/W4297152848","https://openalex.org/W4308627565","https://openalex.org/W4362704894","https://openalex.org/W4367319881","https://openalex.org/W4382128171","https://openalex.org/W4382281941","https://openalex.org/W4386784165","https://openalex.org/W4389328663","https://openalex.org/W4392120324","https://openalex.org/W4392747474","https://openalex.org/W4393217316","https://openalex.org/W4396773505","https://openalex.org/W4396993846","https://openalex.org/W4397004517","https://openalex.org/W4401989156","https://openalex.org/W4404890600","https://openalex.org/W4407145131","https://openalex.org/W4408100195","https://openalex.org/W4408866553","https://openalex.org/W4409535409","https://openalex.org/W4411536645","https://openalex.org/W4414029330","https://openalex.org/W7087721171"],"related_works":[],"abstract_inverted_index":{"The":[0,114],"rapid":[1],"expansion":[2],"of":[3,5,27,68,128,134,141,148,155,164,193],"Internet":[4],"Things":[6],"(IoT)":[7],"systems,":[8],"found":[9],"in":[10,33,199,205],"environments":[11],"such":[12],"as":[13],"smart":[14,206],"homes,":[15],"poses":[16],"growing":[17],"cybersecurity":[18,103],"challenges.":[19],"In":[20,71],"response,":[21],"research":[22],"has":[23],"examined":[24],"the":[25,65,69,110,177,191],"role":[26],"artificial":[28],"intelligence,":[29],"particularly":[30],"machine":[31,41,56],"learning,":[32],"enhancing":[34],"IoT":[35,102,200],"security.":[36],"To":[37],"support":[38],"this":[39,72,93,187],"effort,":[40],"learning":[42,57],"models":[43],"have":[44],"been":[45],"developed":[46],"and":[47,82,105,132,136,143,152,159],"evaluated":[48],"on":[49],"benchmark":[50],"datasets.":[51],"However,":[52],"preparing":[53],"datasets":[54,104,195],"for":[55,101,196],"requires":[58],"preprocessing":[59,87,99,161],"techniques":[60],"that":[61,175],"are":[62],"tailored":[63],"to":[64,90,109,170,190],"specific":[66],"characteristics":[67],"data.":[70],"context,":[73],"exploratory":[74,123],"data":[75,124],"analysis":[76,125,140],"provides":[77],"insights":[78],"into":[79,119],"dataset":[80,130,174],"structure":[81],"distribution,":[83],"thereby":[84],"supporting":[85],"informed":[86],"decisions":[88],"prior":[89],"modeling.":[91],"Accordingly,":[92],"study":[94,188],"introduces":[95],"a":[96,160,172,183],"reproducible":[97],"five-step":[98],"framework":[100,116],"demonstrates":[106],"its":[107],"application":[108],"NF-ToN-IoT":[111],"V1":[112],"dataset.":[113],"proposed":[115],"is":[117],"organized":[118],"two":[120],"phases:":[121],"an":[122],"phase":[126,162],"consisting":[127,163],"(1)":[129],"overview":[131],"identification":[133],"categorical":[135,149],"numerical":[137,156],"features,":[138],"(2)":[139],"missing":[142],"zero":[144],"values,":[145],"(3)":[146],"assessment":[147,154],"feature":[150,157],"distributions,":[151],"(4)":[153],"distributions;":[158],"(5)":[165],"proportional":[166],"stratified":[167],"random":[168],"downsampling":[169],"produce":[171],"reduced":[173],"preserves":[176],"original":[178],"class":[179],"distribution.":[180],"By":[181],"establishing":[182],"systematic,":[184],"data-driven":[185],"framework,":[186],"contributes":[189],"preparation":[192],"structured":[194],"attack":[197],"detection":[198],"environments,":[201],"with":[202],"potential":[203],"applications":[204],"homes.":[207]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-28T09:10:13.091523","created_date":"2026-02-27T00:00:00"}
