{"id":"https://openalex.org/W4386449998","doi":"https://doi.org/10.1109/iccc57788.2023.10233612","title":"Deep Reinforcement Learning for Network Security Applications With A Safety Guide","display_name":"Deep Reinforcement Learning for Network Security Applications With A Safety Guide","publication_year":2023,"publication_date":"2023-08-10","ids":{"openalex":"https://openalex.org/W4386449998","doi":"https://doi.org/10.1109/iccc57788.2023.10233612"},"language":"en","primary_location":{"id":"doi:10.1109/iccc57788.2023.10233612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccc57788.2023.10233612","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CIC International Conference on Communications in China (ICCC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100748265","display_name":"Zhibo Liu","orcid":"https://orcid.org/0000-0001-9210-156X"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhibo Liu","raw_affiliation_strings":["Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","institution_ids":["https://openalex.org/I9842412"]},{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091024726","display_name":"Xiaozhen Lu","orcid":"https://orcid.org/0000-0001-8247-0353"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaozhen Lu","raw_affiliation_strings":["Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","institution_ids":["https://openalex.org/I9842412"]},{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100650500","display_name":"Yuhan Chen","orcid":"https://orcid.org/0000-0001-9796-0291"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhan Chen","raw_affiliation_strings":["Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","institution_ids":["https://openalex.org/I9842412"]},{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102921648","display_name":"Yilin Xiao","orcid":"https://orcid.org/0000-0002-0717-7488"},"institutions":[{"id":"https://openalex.org/I4210104064","display_name":"Shenzhen Academy of Robotics","ror":"https://ror.org/01h027j09","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210104064"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yilin Xiao","raw_affiliation_strings":["Shenzhen Institute of Artificial Intelligence and Robotics for Society,Shenzhen,China","Shenzhen Institute of Artificial Intelligence and Robotics for Society, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institute of Artificial Intelligence and Robotics for Society,Shenzhen,China","institution_ids":["https://openalex.org/I4210104064"]},{"raw_affiliation_string":"Shenzhen Institute of Artificial Intelligence and Robotics for Society, Shenzhen, China","institution_ids":["https://openalex.org/I4210104064"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068976123","display_name":"Liang Xiao","orcid":"https://orcid.org/0000-0003-2402-611X"},"institutions":[{"id":"https://openalex.org/I191208505","display_name":"Xiamen University","ror":"https://ror.org/00mcjh785","country_code":"CN","type":"education","lineage":["https://openalex.org/I191208505"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Xiao","raw_affiliation_strings":["Xiamen University,Department of Informatics and Communication Engineering,Xiamen,China","Department of Informatics and Communication Engineering, Xiamen University, Xiamen, China"],"affiliations":[{"raw_affiliation_string":"Xiamen University,Department of Informatics and Communication Engineering,Xiamen,China","institution_ids":["https://openalex.org/I191208505"]},{"raw_affiliation_string":"Department of Informatics and Communication Engineering, Xiamen University, Xiamen, China","institution_ids":["https://openalex.org/I191208505"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077407278","display_name":"Yanling Bu","orcid":"https://orcid.org/0000-0001-8207-1125"},"institutions":[{"id":"https://openalex.org/I9842412","display_name":"Nanjing University of Aeronautics and Astronautics","ror":"https://ror.org/01scyh794","country_code":"CN","type":"education","lineage":["https://openalex.org/I9842412"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanling Bu","raw_affiliation_strings":["Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Aeronautics and Astronautics,College of Computer Science and Technology,Nanjing,China","institution_ids":["https://openalex.org/I9842412"]},{"raw_affiliation_string":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China","institution_ids":["https://openalex.org/I9842412"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100748265"],"corresponding_institution_ids":["https://openalex.org/I9842412"],"apc_list":null,"apc_paid":null,"fwci":0.1876,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.46967269,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8987899422645569},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7074494957923889},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.5819424390792847},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5033339858055115},{"id":"https://openalex.org/keywords/warning-system","display_name":"Warning system","score":0.47257673740386963},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.4583846926689148},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43068674206733704},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4284816384315491},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4085894525051117},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38575422763824463},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.3710656464099884},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.11015096306800842}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8987899422645569},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7074494957923889},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.5819424390792847},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5033339858055115},{"id":"https://openalex.org/C29825287","wikidata":"https://www.wikidata.org/wiki/Q1427940","display_name":"Warning system","level":2,"score":0.47257673740386963},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.4583846926689148},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43068674206733704},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4284816384315491},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4085894525051117},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38575422763824463},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.3710656464099884},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.11015096306800842},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccc57788.2023.10233612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccc57788.2023.10233612","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CIC International Conference on Communications in China (ICCC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Climate action","score":0.6000000238418579,"id":"https://metadata.un.org/sdg/13"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322769","display_name":"Natural Science Foundation of Jiangsu Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1845972764","https://openalex.org/W2145339207","https://openalex.org/W2522489477","https://openalex.org/W2736601468","https://openalex.org/W2939467494","https://openalex.org/W2963864421","https://openalex.org/W2964043796","https://openalex.org/W3037804676","https://openalex.org/W3040914594","https://openalex.org/W3131625919","https://openalex.org/W3176452384","https://openalex.org/W4210882709","https://openalex.org/W4226071704","https://openalex.org/W4306705058","https://openalex.org/W4312890427","https://openalex.org/W4313053314","https://openalex.org/W6684921986","https://openalex.org/W6692846177","https://openalex.org/W6741002519","https://openalex.org/W6780312303","https://openalex.org/W6838865717","https://openalex.org/W6846122673"],"related_works":["https://openalex.org/W1985560493","https://openalex.org/W2386410636","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894","https://openalex.org/W3096874164","https://openalex.org/W2357975469","https://openalex.org/W4400868993","https://openalex.org/W2937181779","https://openalex.org/W2145363145"],"abstract_inverted_index":{"Most":[0],"of":[1,121,211],"the":[2,11,16,25,30,60,84,93,103,113,119,130,136,141,147,157,163,177,185,195,205,209,216],"typical":[3],"reinforcement":[4,48],"learning":[5,49,61,187],"algorithms":[6],"help":[7],"wireless":[8],"devices":[9],"choose":[10,83],"security":[12],"policy":[13,21,85,95],"such":[14],"as":[15],"moving":[17],"strategy":[18],"and":[19,86,125,140,172],"communication":[20],"by":[22,146],"exploring":[23,65],"all":[24],"possible":[26],"state-action":[27,123],"pairs":[28],"including":[29],"risky":[31,66,174],"policies":[32],"that":[33,96,111,128],"cause":[34],"a":[35,46,73,78,88,107,126,152,169,173,190,199],"severe":[36],"collision":[37],"or":[38,77],"network":[39,76],"disaster.":[40],"In":[41],"this":[42,149],"paper,":[43],"we":[44,193],"design":[45],"safe":[47,170,218],"algorithm":[50,69,150,161,197,213],"for":[51,176],"safety-critical":[52],"applications":[53],"(e.g.,":[54],"intelligent":[55],"transportation":[56,201],"systems)":[57],"to":[58,63,82,91,118,155,167,180],"guide":[59,90,105],"agent":[62],"avoid":[64],"policies.":[67],"This":[68,160],"uses":[70,151,162],"Q-network":[71],"(i.e.,":[72],"convolutional":[74],"neural":[75,80],"deep":[79,219],"network)":[81],"designs":[87],"safety":[89,104,153],"modify":[92,156],"chosen":[94,158],"results":[97,207],"in":[98,184,198,203],"dangerous":[99],"status.":[100],"More":[101],"specifically,":[102],"includes":[106],"risk":[108,120,132,138],"alarm":[109],"module":[110],"evaluates":[112],"immediate":[114,164],"warning":[115,165],"value":[116,139,166],"corresponding":[117],"each":[122],"pair":[124],"G-network":[127,178],"estimates":[129],"long-term":[131,137,142],"value.":[133],"By":[134],"adding":[135],"expected":[143],"reward":[144],"output":[145],"Q-network,":[148],"dock":[154],"policy.":[159],"formulate":[168],"buffer":[171,175],"updating":[179],"ensure":[181],"fully":[182],"exploration":[183],"initial":[186],"process.":[188],"As":[189],"case":[191],"study,":[192],"apply":[194],"designed":[196],"cargo":[200],"system,":[202],"which":[204],"experimental":[206],"verify":[208],"effectiveness":[210],"our":[212],"compared":[214],"with":[215],"benchmark":[217],"Q-network.":[220]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
