{"id":"https://openalex.org/W7117897182","doi":"https://doi.org/10.1109/milcom64451.2025.11310030","title":"CyberStack: Deep Reinforcement Learning in Stackelberg Games for Military Network Defense","display_name":"CyberStack: Deep Reinforcement Learning in Stackelberg Games for Military Network Defense","publication_year":2025,"publication_date":"2025-10-06","ids":{"openalex":"https://openalex.org/W7117897182","doi":"https://doi.org/10.1109/milcom64451.2025.11310030"},"language":null,"primary_location":{"id":"doi:10.1109/milcom64451.2025.11310030","is_oa":false,"landing_page_url":"https://doi.org/10.1109/milcom64451.2025.11310030","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"MILCOM 2025 - 2025 IEEE Military Communications Conference (MILCOM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102726323","display_name":"Aws Jaber","orcid":null},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Aws Jaber","raw_affiliation_strings":["KTH Royal Institute of Technology,Division of Network and Systems Engineering,Stockholm,Sweden"],"affiliations":[{"raw_affiliation_string":"KTH Royal Institute of Technology,Division of Network and Systems Engineering,Stockholm,Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083051879","display_name":"Angel Genchev","orcid":"https://orcid.org/0000-0002-0672-737X"},"institutions":[{"id":"https://openalex.org/I4210092588","display_name":"\"Professor Tsvetan Lazarov\" Defence Institute","ror":"https://ror.org/00fr2wv68","country_code":"BG","type":"government","lineage":["https://openalex.org/I4210092588"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Angel D. Genchev","raw_affiliation_strings":["Bulgarian Defence Institute,Directorate \"Development of C4I Systems\",Sofia,Bulgaria"],"affiliations":[{"raw_affiliation_string":"Bulgarian Defence Institute,Directorate \"Development of C4I Systems\",Sofia,Bulgaria","institution_ids":["https://openalex.org/I4210092588"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077910506","display_name":"Gudmund Grov","orcid":"https://orcid.org/0000-0001-8837-5496"},"institutions":[{"id":"https://openalex.org/I163244428","display_name":"Norwegian Defence Research Establishment","ror":"https://ror.org/0098gnz32","country_code":"NO","type":"facility","lineage":["https://openalex.org/I163244428"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Gudmund Grov","raw_affiliation_strings":["University of Oslo,Norwegian Defence Research Establishment (FFI),Kjeller,Norway"],"affiliations":[{"raw_affiliation_string":"University of Oslo,Norwegian Defence Research Establishment (FFI),Kjeller,Norway","institution_ids":["https://openalex.org/I163244428"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5099140526","display_name":"Tsvetelin Tsonev","orcid":null},"institutions":[{"id":"https://openalex.org/I4210092588","display_name":"\"Professor Tsvetan Lazarov\" Defence Institute","ror":"https://ror.org/00fr2wv68","country_code":"BG","type":"government","lineage":["https://openalex.org/I4210092588"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Tsvetelin Tsonev","raw_affiliation_strings":["Bulgarian Defence Institute,Directorate \"Development of C4I Systems\",Sofia,Bulgaria"],"affiliations":[{"raw_affiliation_string":"Bulgarian Defence Institute,Directorate \"Development of C4I Systems\",Sofia,Bulgaria","institution_ids":["https://openalex.org/I4210092588"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102726323"],"corresponding_institution_ids":["https://openalex.org/I86987016"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.66949969,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"874","last_page":"875"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.3359000086784363,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.3359000086784363,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11807","display_name":"Infrastructure Resilience and Vulnerability Analysis","score":0.1574999988079071,"subfield":{"id":"https://openalex.org/subfields/2205","display_name":"Civil and Structural Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.15299999713897705,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stackelberg-competition","display_name":"Stackelberg competition","score":0.7275000214576721},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.677299976348877},{"id":"https://openalex.org/keywords/action-selection","display_name":"Action selection","score":0.5712000131607056},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5001999735832214},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.4984000027179718},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.44119998812675476},{"id":"https://openalex.org/keywords/bayesian-network","display_name":"Bayesian network","score":0.438400000333786},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.4284999966621399},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.42309999465942383}],"concepts":[{"id":"https://openalex.org/C199510392","wikidata":"https://www.wikidata.org/wiki/Q1184602","display_name":"Stackelberg competition","level":2,"score":0.7275000214576721},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.677299976348877},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6725999712944031},{"id":"https://openalex.org/C166109690","wikidata":"https://www.wikidata.org/wiki/Q4677422","display_name":"Action selection","level":3,"score":0.5712000131607056},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5001999735832214},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.4984000027179718},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.492900013923645},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.44119998812675476},{"id":"https://openalex.org/C33724603","wikidata":"https://www.wikidata.org/wiki/Q812540","display_name":"Bayesian network","level":2,"score":0.438400000333786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42879998683929443},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.4284999966621399},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.41670000553131104},{"id":"https://openalex.org/C124119293","wikidata":"https://www.wikidata.org/wiki/Q6046081","display_name":"Interdiction","level":2,"score":0.3562999963760376},{"id":"https://openalex.org/C191267431","wikidata":"https://www.wikidata.org/wiki/Q911932","display_name":"Honeypot","level":2,"score":0.35409998893737793},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.3407999873161316},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C41065033","wikidata":"https://www.wikidata.org/wiki/Q2825412","display_name":"Adversary","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C192126672","wikidata":"https://www.wikidata.org/wiki/Q1068715","display_name":"Telecommunications network","level":2,"score":0.3012999892234802},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3012000024318695},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C182590292","wikidata":"https://www.wikidata.org/wiki/Q989632","display_name":"Network security","level":2,"score":0.28040000796318054},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.2603999972343445},{"id":"https://openalex.org/C20136886","wikidata":"https://www.wikidata.org/wiki/Q749647","display_name":"Interoperability","level":2,"score":0.2597000002861023},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/milcom64451.2025.11310030","is_oa":false,"landing_page_url":"https://doi.org/10.1109/milcom64451.2025.11310030","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"MILCOM 2025 - 2025 IEEE Military Communications Conference (MILCOM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5827393531799316,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320318377","display_name":"European Defence Fund","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2907660552","https://openalex.org/W2952298682","https://openalex.org/W4250589301","https://openalex.org/W4389549215","https://openalex.org/W4411799826"],"related_works":[],"abstract_inverted_index":{"Securing":[0],"military":[1,94],"communication":[2],"networks":[3,95],"against":[4],"advanced":[5],"persistent":[6],"threats":[7],"(APTs)":[8],"is":[9],"critical":[10,97],"for":[11,93],"mission":[12],"success.":[13],"We":[14],"introduce":[15],"CyberStack,":[16],"a":[17,45,48,52,89],"cyber-defense":[18],"simulation":[19],"that":[20],"integrates":[21],"deep":[22,73],"reinforcement":[23],"learning":[24],"(DRL)":[25],"and":[26,47,69,78,96],"Stackelberg":[27],"Markov":[28],"Security":[29],"Games":[30],"(SMSG)":[31],"to":[32],"optimize":[33],"adaptive":[34],"defensive":[35],"strategies.":[36],"Leveraging":[37],"real-world":[38],"Suricata":[39],"EVE":[40],"JSON":[41],"logs,":[42],"CyberStack":[43],"models":[44],"defender":[46],"Bayesian":[49],"attacker":[50],"in":[51],"high-fidelity":[53],"cyber":[54],"range,":[55],"enabling":[56],"the":[57],"selection":[58],"of":[59,62],"optimal":[60],"Courses":[61],"Action":[63],"(CoAs),":[64],"such":[65],"as":[66],"IP":[67],"blocking":[68],"server":[70],"isolation.":[71],"A":[72],"RL":[74],"agent,":[75],"combining":[76],"Actor-Critic":[77],"Deep":[79],"Q-Network":[80],"(DQN)":[81],"models.":[82],"This":[83],"work":[84],"advances":[85],"AI-driven":[86],"cybersecurity,":[87],"offering":[88],"scalable":[90],"defense":[91],"mechanism":[92],"infrastructure.":[98]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-01T00:00:00"}
