{"id":"https://openalex.org/W4360995553","doi":"https://doi.org/10.1109/tiv.2023.3262132","title":"Event-Triggered Deep Reinforcement Learning Using Parallel Control: A Case Study in Autonomous Driving","display_name":"Event-Triggered Deep Reinforcement Learning Using Parallel Control: A Case Study in Autonomous Driving","publication_year":2023,"publication_date":"2023-03-27","ids":{"openalex":"https://openalex.org/W4360995553","doi":"https://doi.org/10.1109/tiv.2023.3262132"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2023.3262132","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2023.3262132","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033954140","display_name":"Jingwei Lu","orcid":"https://orcid.org/0000-0001-5789-3522"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112270","display_name":"Qingdao Academy of Intelligent Industries","ror":"https://ror.org/02a0rnh86","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112270"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingwei Lu","raw_affiliation_strings":["Parallel Intelligence Innovation Research Center, Qingdao Academy of Intelligent Industries, Qingdao, China","State Key Laboratory for Management and Control of Complex Systems, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Parallel Intelligence Innovation Research Center, Qingdao Academy of Intelligent Industries, Qingdao, China","institution_ids":["https://openalex.org/I4210112270"]},{"raw_affiliation_string":"State Key Laboratory for Management and Control of Complex Systems, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101561534","display_name":"Liyuan Han","orcid":"https://orcid.org/0000-0003-3535-4258"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liyuan Han","raw_affiliation_strings":["State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087825639","display_name":"Qinglai Wei","orcid":"https://orcid.org/0000-0001-7002-9800"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qinglai Wei","raw_affiliation_strings":["State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112719601","display_name":"Xiao Wang","orcid":"https://orcid.org/0000-0002-0008-0659"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]},{"id":"https://openalex.org/I4210112270","display_name":"Qingdao Academy of Intelligent Industries","ror":"https://ror.org/02a0rnh86","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210112270"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Wang","raw_affiliation_strings":["School of Artificial Intelligence, Anhui University, Hefei, China","Qingdao Academy of Intelligent Industries, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Qingdao Academy of Intelligent Industries, Qingdao, China","institution_ids":["https://openalex.org/I4210112270"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057269411","display_name":"Xingyuan Dai","orcid":"https://orcid.org/0000-0001-7517-5049"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingyuan Dai","raw_affiliation_strings":["State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113600509","display_name":"Fei\u2010Yue Wang","orcid":"https://orcid.org/0000-0001-9185-3989"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei-Yue Wang","raw_affiliation_strings":["State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Management and Control of Complex Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5033954140"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210112270"],"apc_list":null,"apc_paid":null,"fwci":16.5314,"has_fulltext":false,"cited_by_count":96,"citation_normalized_percentile":{"value":0.99428391,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"8","issue":"4","first_page":"2821","last_page":"2831"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8457475900650024},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7528876066207886},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7487970590591431},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6164700984954834},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6105550527572632},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.587332546710968},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.514644980430603},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5020012855529785},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5007627010345459},{"id":"https://openalex.org/keywords/realization","display_name":"Realization (probability)","score":0.5003829002380371},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.43766531348228455},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4268166124820709},{"id":"https://openalex.org/keywords/value-network","display_name":"Value network","score":0.42346620559692383},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32017165422439575},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.30593764781951904},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.12486940622329712},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10338437557220459},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09730538725852966},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08426588773727417}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8457475900650024},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7528876066207886},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7487970590591431},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6164700984954834},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6105550527572632},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.587332546710968},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.514644980430603},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5020012855529785},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5007627010345459},{"id":"https://openalex.org/C2781089630","wikidata":"https://www.wikidata.org/wiki/Q21856745","display_name":"Realization (probability)","level":2,"score":0.5003829002380371},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.43766531348228455},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4268166124820709},{"id":"https://openalex.org/C89249532","wikidata":"https://www.wikidata.org/wiki/Q7912758","display_name":"Value network","level":3,"score":0.42346620559692383},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32017165422439575},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.30593764781951904},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.12486940622329712},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10338437557220459},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09730538725852966},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08426588773727417},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C4216890","wikidata":"https://www.wikidata.org/wiki/Q815823","display_name":"Business model","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tiv.2023.3262132","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2023.3262132","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8100000023841858,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1972107234","https://openalex.org/W1978518835","https://openalex.org/W2133747588","https://openalex.org/W2145339207","https://openalex.org/W2201581102","https://openalex.org/W2332672415","https://openalex.org/W2361439446","https://openalex.org/W2404399993","https://openalex.org/W2460713275","https://openalex.org/W2724169821","https://openalex.org/W2738419683","https://openalex.org/W2746553466","https://openalex.org/W2761873684","https://openalex.org/W2889856497","https://openalex.org/W2951799221","https://openalex.org/W2953303875","https://openalex.org/W2955358943","https://openalex.org/W2964043796","https://openalex.org/W2981207549","https://openalex.org/W2981402159","https://openalex.org/W2989958156","https://openalex.org/W3016409148","https://openalex.org/W3090027660","https://openalex.org/W3097662863","https://openalex.org/W3100789280","https://openalex.org/W3101086659","https://openalex.org/W3127561923","https://openalex.org/W3128395826","https://openalex.org/W3151151945","https://openalex.org/W3159959744","https://openalex.org/W3203162172","https://openalex.org/W3212958986","https://openalex.org/W4200045037","https://openalex.org/W4226239849","https://openalex.org/W4229057997","https://openalex.org/W4285272860","https://openalex.org/W4298876402","https://openalex.org/W4310875027","https://openalex.org/W4311409157","https://openalex.org/W4312081468","https://openalex.org/W4312769831","https://openalex.org/W4388286312","https://openalex.org/W6683300800","https://openalex.org/W6685444567","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6740092555","https://openalex.org/W6841694480"],"related_works":["https://openalex.org/W4400868993","https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894","https://openalex.org/W2315999538"],"abstract_inverted_index":{"This":[0],"paper":[1],"utilizes":[2],"parallel":[3,40],"control":[4,56,65,101],"to":[5,76,104,130,157,182],"investigate":[6],"the":[7,37,42,50,60,63,69,73,78,84,95,98,106,110,118,122,127,133,150,160,178,194],"problem":[8],"of":[9,23,39,47,62,97,109,117,165],"event-triggered":[10,17,162,192],"deep":[11,18,144,184],"reinforcement":[12],"learning":[13],"and":[14,52,72,121,154,200],"develops":[15],"an":[16,30,169],"Q-network":[19,145],"(ETDQN)":[20],"for":[21],"decision-making":[22,163],"autonomous":[24,166],"driving,":[25],"<italic":[26],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[27],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">without":[28],"training":[29],"explicit":[31,170],"triggering":[32,171],"condition</i>":[33],".":[34],"Based":[35],"on":[36,141],"framework":[38],"control,":[41,193],"developed":[43,99,128,179,195],"ETDQN":[44,129,180,196],"incorporates":[45],"information":[46,116],"actions":[48],"into":[49],"feedback":[51],"constructs":[53],"a":[54],"dynamic":[55,64,100],"policy.":[57],"First,":[58],"in":[59,191],"realization":[61],"policy,":[66],"we":[67,148],"integrate":[68],"current":[70,119],"state":[71,80,114,120],"previous":[74,123],"action":[75],"construct":[77],"augmented":[79,85,113,151],"as":[81,83],"well":[82],"Markov":[86],"decision":[87],"process.":[88],"Meanwhile,":[89],"it":[90],"is":[91,103,174],"shown":[92],"theoretically":[93],"that":[94,177],"goal":[96],"policy":[102,164],"learn":[105,159],"variation":[107],"rate":[108],"action.":[111],"The":[112],"contains":[115],"action,":[124],"which":[125],"enables":[126],"directly":[131,158],"design":[132],"immediate":[134],"reward":[135],"considering":[136],"communication":[137,202],"loss.":[138],"Then,":[139],"based":[140],"dueling":[142,198],"double":[143],"(dueling":[146],"DDQN),":[147],"establish":[149],"action-value,":[152],"value,":[153],"advantage":[155],"functions":[156],"optimal":[161],"driving":[167],"without":[168],"condition.":[172],"It":[173],"worth":[175],"noticing":[176],"applies":[181],"various":[183],"Q-networks":[185],"(DQNs).":[186],"Empirical":[187],"results":[188],"demonstrate":[189],"that,":[190],"outperforms":[197],"DDQN":[199],"reduces":[201],"loss":[203],"effectively.":[204]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":36},{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":19}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
