{"id":"https://openalex.org/W4417003199","doi":"https://doi.org/10.1109/tsmc.2025.3636912","title":"Optimal Hybrid Transmission Strategy for Remote State Estimation With Deep Reinforcement Learning","display_name":"Optimal Hybrid Transmission Strategy for Remote State Estimation With Deep Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-04","ids":{"openalex":"https://openalex.org/W4417003199","doi":"https://doi.org/10.1109/tsmc.2025.3636912"},"language":null,"primary_location":{"id":"doi:10.1109/tsmc.2025.3636912","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3636912","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059396055","display_name":"Hongxia Rao","orcid":"https://orcid.org/0000-0002-4068-5986"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongxia Rao","raw_affiliation_strings":["Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009279450","display_name":"Zhuzhou Li","orcid":"https://orcid.org/0009-0001-9019-1503"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zitian Li","raw_affiliation_strings":["Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034027393","display_name":"Lixin Yang","orcid":"https://orcid.org/0000-0001-6972-3272"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Lixin Yang","raw_affiliation_strings":["School of Electrical and Computer Engineering, National University of Singapore, Lower Kent Ridge Road, Singapore","School of Electrical and Computer Engineering, National University of Singapore, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, National University of Singapore, Lower Kent Ridge Road, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"School of Electrical and Computer Engineering, National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044552537","display_name":"Yong Xu","orcid":"https://orcid.org/0000-0003-2219-7732"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Xu","raw_affiliation_strings":["Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, School of Automation, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"School of Automation, Guangdong Provincial Key Laboratory of Intelligent Decision and Cooperative Control, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074290686","display_name":"Tingwen Huang","orcid":"https://orcid.org/0000-0001-9610-846X"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingwen Huang","raw_affiliation_strings":["Faculty of Computer Science and Control Engineering, Shenzhen University of Advanced Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Computer Science and Control Engineering, Shenzhen University of Advanced Technology, Shenzhen, China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I180726961"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043134796","display_name":"Leszek Rutkowski","orcid":"https://orcid.org/0000-0001-6960-9525"},"institutions":[{"id":"https://openalex.org/I686019","display_name":"AGH University of Krakow","ror":"https://ror.org/00bas1c41","country_code":"PL","type":"education","lineage":["https://openalex.org/I686019"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Leszek Rutkowski","raw_affiliation_strings":["AGH University, Krak&#x00F3;w, Poland"],"affiliations":[{"raw_affiliation_string":"AGH University, Krak&#x00F3;w, Poland","institution_ids":["https://openalex.org/I686019"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5059396055"],"corresponding_institution_ids":["https://openalex.org/I139024713"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.43558455,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"56","issue":"2","first_page":"849","last_page":"860"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.40470001101493835,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.40470001101493835,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12879","display_name":"Distributed Sensor Networks and Detection Algorithms","score":0.07930000126361847,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10080","display_name":"Energy Efficient Wireless Sensor Networks","score":0.05009999871253967,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7882000207901001},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6707000136375427},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.5562000274658203},{"id":"https://openalex.org/keywords/transmission","display_name":"Transmission (telecommunications)","score":0.4869000017642975},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4564000070095062},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4397999942302704},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.42820000648498535},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4242999851703644}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7882000207901001},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6794000267982483},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6707000136375427},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5562000274658203},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.4869000017642975},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4564000070095062},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.44179999828338623},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4397999942302704},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.42820000648498535},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4242999851703644},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4106000065803528},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3919999897480011},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.39070001244544983},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.36980000138282776},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.34940001368522644},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3465999960899353},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.3059000074863434},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.3009999990463257},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.2874000072479248},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.27649998664855957},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2671000063419342}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2025.3636912","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3636912","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1969403520","https://openalex.org/W2052334067","https://openalex.org/W2152520525","https://openalex.org/W2559563404","https://openalex.org/W2566133870","https://openalex.org/W2595507424","https://openalex.org/W2623956239","https://openalex.org/W2890604364","https://openalex.org/W2907662451","https://openalex.org/W2941097477","https://openalex.org/W2970144961","https://openalex.org/W2994803162","https://openalex.org/W2996540419","https://openalex.org/W3000486967","https://openalex.org/W3009323257","https://openalex.org/W3014928495","https://openalex.org/W3098044967","https://openalex.org/W3118347885","https://openalex.org/W3128363799","https://openalex.org/W3156666998","https://openalex.org/W3202065172","https://openalex.org/W4206480836","https://openalex.org/W4210319381","https://openalex.org/W4226110370","https://openalex.org/W4285166862","https://openalex.org/W4285262488","https://openalex.org/W4285288936","https://openalex.org/W4312692127","https://openalex.org/W4313165551","https://openalex.org/W4313839174","https://openalex.org/W4317496722","https://openalex.org/W4375929136","https://openalex.org/W4384787804","https://openalex.org/W4388262692","https://openalex.org/W4403936634"],"related_works":[],"abstract_inverted_index":{"This":[0,61],"work":[1],"delves":[2],"into":[3],"an":[4,97,128],"optimal":[5,98,129,142,168],"hybrid":[6,56],"transmission":[7,57,99],"strategy":[8,58,62,101],"for":[9],"remote":[10,29],"state":[11,25],"estimation":[12],"(RSE),":[13],"where":[14],"some":[15],"smart":[16,64],"sensors":[17,65],"observe":[18],"various":[19],"systems":[20],"and":[21,45,82,89,109,131,174],"transmit":[22],"their":[23],"local":[24],"estimates":[26],"to":[27,66,95,165],"a":[28,37,50,54,116,121,147],"estimator.":[30],"Inspired":[31],"by":[32,183],"the":[33,42,69,73,104,107,125,141,154,167,171,175,178],"high":[34],"bandwidth":[35],"of":[36,49,106,127,140,177],"high-frequency":[38],"(HF)":[39],"link":[40,71,75,108],"alongside":[41],"robust":[43],"reliability":[44],"low":[46],"energy":[47,83],"consumption":[48],"low-frequency":[51],"(LF)":[52],"link,":[53],"novel":[55],"is":[59,93,135,163],"proposed.":[60],"allows":[63],"utilize":[67],"either":[68],"HF":[70],"or":[72],"LF":[74],"dynamically,":[76],"each":[77],"with":[78],"distinct":[79],"channel":[80,110],"characteristics":[81,139],"consumption.":[84],"To":[85],"achieve":[86],"highly":[87],"reliable":[88],"energy-efficient":[90],"transmission,":[91],"it":[92],"imperative":[94],"devise":[96],"scheduling":[100],"that":[102],"dictates":[103],"selection":[105],"allocation.":[111],"Formulating":[112],"this":[113],"challenge":[114],"as":[115],"Markov":[117],"decision":[118],"process":[119],"(MDP),":[120],"sufficient":[122],"condition":[123],"ensuring":[124],"existence":[126],"deterministic":[130],"stationary":[132],"(ODS)":[133],"policy":[134,143],"established.":[136],"The":[137],"structural":[138,172],"are":[144,181],"derived.":[145],"Furthermore,":[146],"deep":[148,157],"reinforcement":[149],"learning":[150],"(DRL)":[151],"approach,":[152],"specifically":[153],"dueling":[155],"double":[156],"<italic":[158],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[159],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Q</i>-network":[160],"(D3QN)":[161],"algorithm,":[162],"employed":[164],"approximate":[166],"policy.":[169],"Finally,":[170],"results":[173],"effectiveness":[176],"DRL":[179],"algorithm":[180],"verified":[182],"simulation":[184],"examples.":[185]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-04T00:00:00"}
