{"id":"https://openalex.org/W3174572831","doi":"https://doi.org/10.1109/jstsp.2021.3091842","title":"Shallow Reinforcement Learning for Energy Harvesting Communications With Imperfect Channel Knowledge","display_name":"Shallow Reinforcement Learning for Energy Harvesting Communications With Imperfect Channel Knowledge","publication_year":2021,"publication_date":"2021-06-23","ids":{"openalex":"https://openalex.org/W3174572831","doi":"https://doi.org/10.1109/jstsp.2021.3091842","mag":"3174572831"},"language":"en","primary_location":{"id":"doi:10.1109/jstsp.2021.3091842","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2021.3091842","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5042930561","display_name":"Heasung Kim","orcid":"https://orcid.org/0000-0003-3860-8962"},"institutions":[{"id":"https://openalex.org/I57664883","display_name":"Ajou University","ror":"https://ror.org/03tzb2h73","country_code":"KR","type":"education","lineage":["https://openalex.org/I57664883"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Heasung Kim","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Ajou University, Suwon, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Ajou University, Suwon, South Korea","institution_ids":["https://openalex.org/I57664883"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100376261","display_name":"Jungwoo Lee","orcid":"https://orcid.org/0000-0002-6804-980X"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jungwoo Lee","raw_affiliation_strings":["Communications and Machine Learning Laboratory, Department of Electrical and Computer Engineering, Seoul National University, Seoul, South Korea"],"affiliations":[{"raw_affiliation_string":"Communications and Machine Learning Laboratory, Department of Electrical and Computer Engineering, Seoul National University, Seoul, South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009725517","display_name":"Wonjae Shin","orcid":"https://orcid.org/0000-0001-6513-1237"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]},{"id":"https://openalex.org/I57664883","display_name":"Ajou University","ror":"https://ror.org/03tzb2h73","country_code":"KR","type":"education","lineage":["https://openalex.org/I57664883"]}],"countries":["KR","US"],"is_corresponding":false,"raw_author_name":"Wonjae Shin","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Ajou University, Suwon, South Korea","Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Ajou University, Suwon, South Korea","institution_ids":["https://openalex.org/I57664883"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042307561","display_name":"H. Vincent Poor","orcid":"https://orcid.org/0000-0002-2062-131X"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"H. Vincent Poor","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Princeton University, Princeton, NJ, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5042930561"],"corresponding_institution_ids":["https://openalex.org/I57664883"],"apc_list":null,"apc_paid":null,"fwci":0.1012,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.42010419,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"15","issue":"5","first_page":"1258","last_page":"1271"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11230","display_name":"Innovative Energy Harvesting Technologies","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8566733598709106},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7829619646072388},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6877262592315674},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5830401182174683},{"id":"https://openalex.org/keywords/monotonic-function","display_name":"Monotonic function","score":0.5563445091247559},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48266011476516724},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4545906186103821},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.41412651538848877},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3182072341442108},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.14249363541603088},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11216381192207336}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8566733598709106},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7829619646072388},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6877262592315674},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5830401182174683},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.5563445091247559},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48266011476516724},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4545906186103821},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.41412651538848877},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3182072341442108},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14249363541603088},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11216381192207336},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jstsp.2021.3091842","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jstsp.2021.3091842","pdf_url":null,"source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.8600000143051147,"id":"https://metadata.un.org/sdg/7"}],"awards":[{"id":"https://openalex.org/G7920959503","display_name":null,"funder_award_id":"CCF-1908308","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G873822990","display_name":null,"funder_award_id":"NRF5199991514504","funder_id":"https://openalex.org/F4320312071","funder_display_name":"Ministry of Education, Libya"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320312071","display_name":"Ministry of Education, Libya","ror":"https://ror.org/02w030k33"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W389907844","https://openalex.org/W1520252399","https://openalex.org/W1522301498","https://openalex.org/W1533861849","https://openalex.org/W1556911442","https://openalex.org/W1757796397","https://openalex.org/W1794490453","https://openalex.org/W2031183328","https://openalex.org/W2031440489","https://openalex.org/W2035229442","https://openalex.org/W2058159521","https://openalex.org/W2065154528","https://openalex.org/W2081751842","https://openalex.org/W2091633261","https://openalex.org/W2099111195","https://openalex.org/W2101600135","https://openalex.org/W2119567691","https://openalex.org/W2120686080","https://openalex.org/W2145834571","https://openalex.org/W2155027007","https://openalex.org/W2163754837","https://openalex.org/W2173248099","https://openalex.org/W2215378786","https://openalex.org/W2248060815","https://openalex.org/W2325147653","https://openalex.org/W2490752264","https://openalex.org/W2521805807","https://openalex.org/W2614312052","https://openalex.org/W2781726626","https://openalex.org/W2797527950","https://openalex.org/W2915095714","https://openalex.org/W2939455399","https://openalex.org/W2949561945","https://openalex.org/W2953148557","https://openalex.org/W2963864421","https://openalex.org/W2964121744","https://openalex.org/W2979897999","https://openalex.org/W3080594196","https://openalex.org/W3088912578","https://openalex.org/W3104547250","https://openalex.org/W3104974366","https://openalex.org/W3121332813","https://openalex.org/W4233840023","https://openalex.org/W4298857966","https://openalex.org/W4394672593","https://openalex.org/W6631190155","https://openalex.org/W6631943919","https://openalex.org/W6637967152","https://openalex.org/W6683204974","https://openalex.org/W6684921986","https://openalex.org/W6690771958","https://openalex.org/W6734517396","https://openalex.org/W6747473740","https://openalex.org/W6750629867"],"related_works":["https://openalex.org/W2374250903","https://openalex.org/W2077314575","https://openalex.org/W4315701745","https://openalex.org/W1990290471","https://openalex.org/W4380682190","https://openalex.org/W2005710836","https://openalex.org/W2102386043","https://openalex.org/W2945307361","https://openalex.org/W1987764909","https://openalex.org/W2116636209"],"abstract_inverted_index":{"This":[0],"study":[1],"aims":[2],"to":[3,9,20,41,57,75,117,136,181],"address":[4],"the":[5,11,14,21,42,54,58,70,76,83,90,97,104,119,156,160,167],"power":[6,78,92,172],"allocation":[7,79,93,173],"problem":[8],"maximize":[10],"sum":[12],"of":[13,60,100],"generalized":[15],"mutual":[16],"information,":[17,28],"which":[18,47,116,144],"refers":[19],"achievable":[22],"rate":[23],"with":[24,129],"imperfect":[25],"channel":[26],"state":[27],"through":[29],"a":[30,49,124,177],"reinforcement":[31],"learning":[32],"(RL)":[33],"approach":[34],"in":[35],"energy":[36],"harvesting":[37],"communications.":[38],"In":[39],"contrast":[40],"conventional":[43],"deep":[44,61,141],"RL":[45,67],"applications,":[46],"incur":[48],"large":[50],"computational":[51],"load":[52],"on":[53,103,115],"devices":[55],"due":[56,180],"use":[59,123],"neural":[62,142],"networks,":[63,143],"we":[64,95,154],"adopt":[65],"shallow":[66,84,120,162],"architectures":[68,85,163],"involving":[69],"optimal":[71,77,182],"structural":[72,110,183],"properties":[73,111],"pertaining":[74],"policy.":[80],"To":[81],"design":[82],"that":[86,133,166],"can":[87],"fully":[88],"capture":[89],"desired":[91],"policy,":[94],"derive":[96],"partial":[98],"monotonicity":[99],"and":[101,106,164,175],"bounds":[102],"policy":[105,126],"value":[107],"functions.":[108],"These":[109],"represent":[112],"mathematical":[113],"bases":[114],"construct":[118],"architecture.":[121],"We":[122],"deterministic":[125],"gradient":[127],"method":[128,169],"monotonically":[130],"shape-constrained":[131],"approximators":[132],"allow":[134],"us":[135],"avoid":[137],"using":[138],"overly":[139],"complicated":[140],"are":[145],"not":[146],"suitable":[147],"for":[148],"low-power":[149],"devices.":[150],"Through":[151],"various":[152],"experiments,":[153],"visualize":[155],"solutions":[157],"derived":[158],"from":[159],"proposed":[161,168],"demonstrate":[165],"outperforms":[170],"existing":[171],"policies":[174],"exhibits":[176],"greater":[178],"robustness":[179],"properties.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
