{"id":"https://openalex.org/W4388040498","doi":"https://doi.org/10.1109/pimrc56721.2023.10294047","title":"Collaborative Deep Reinforcement Learning for Resource Optimization in Non-Terrestrial Networks","display_name":"Collaborative Deep Reinforcement Learning for Resource Optimization in Non-Terrestrial Networks","publication_year":2023,"publication_date":"2023-09-05","ids":{"openalex":"https://openalex.org/W4388040498","doi":"https://doi.org/10.1109/pimrc56721.2023.10294047"},"language":"en","primary_location":{"id":"doi:10.1109/pimrc56721.2023.10294047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pimrc56721.2023.10294047","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 34th Annual International Symposium on Personal, Indoor and Mobile Radio Communications (PIMRC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100651885","display_name":"Yang Cao","orcid":"https://orcid.org/0000-0002-8061-4066"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]},{"id":"https://openalex.org/I3018263800","display_name":"Huzhou University","ror":"https://ror.org/04mvpxy20","country_code":"CN","type":"education","lineage":["https://openalex.org/I3018263800"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Cao","raw_affiliation_strings":["University of Electronic Science and Technology of China,Yangtze Delta Region Institute (Huzhou),Huzhou,P. R. China","University of Electronic Science and Technology of China, Chengdu, P. R. China","Yangtze Delta Region Institute (Huzhou), University of Electronic Science and Technology of China, Huzhou, P. R. China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China,Yangtze Delta Region Institute (Huzhou),Huzhou,P. R. China","institution_ids":["https://openalex.org/I3018263800"]},{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, P. R. China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"Yangtze Delta Region Institute (Huzhou), University of Electronic Science and Technology of China, Huzhou, P. R. China","institution_ids":["https://openalex.org/I3018263800","https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017575745","display_name":"Shao\u2010Yu Lien","orcid":"https://orcid.org/0000-0002-4347-2871"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shao-Yu Lien","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Tainan City,Taiwan","National Yang Ming Chiao Tung University, Tainan City, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Tainan City,Taiwan","institution_ids":["https://openalex.org/I148366613"]},{"raw_affiliation_string":"National Yang Ming Chiao Tung University, Tainan City, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007832415","display_name":"Ying\u2010Chang Liang","orcid":"https://orcid.org/0000-0003-2671-5090"},"institutions":[{"id":"https://openalex.org/I3018263800","display_name":"Huzhou University","ror":"https://ror.org/04mvpxy20","country_code":"CN","type":"education","lineage":["https://openalex.org/I3018263800"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying-Chang Liang","raw_affiliation_strings":["University of Electronic Science and Technology of China,Yangtze Delta Region Institute (Huzhou),Huzhou,P. R. China","University of Electronic Science and Technology of China, Chengdu, P. R. China","Yangtze Delta Region Institute (Huzhou), University of Electronic Science and Technology of China, Huzhou, P. R. China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China,Yangtze Delta Region Institute (Huzhou),Huzhou,P. R. China","institution_ids":["https://openalex.org/I3018263800"]},{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, P. R. China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"Yangtze Delta Region Institute (Huzhou), University of Electronic Science and Technology of China, Huzhou, P. R. China","institution_ids":["https://openalex.org/I3018263800","https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091266202","display_name":"Dusit Niyato","orcid":"https://orcid.org/0000-0002-7442-7416"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dusit Niyato","raw_affiliation_strings":["Nanyang Technological University,Singapore","Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University,Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100773343","display_name":"Xuemin Shen","orcid":"https://orcid.org/0000-0002-4140-287X"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Xuemin Sherman Shen","raw_affiliation_strings":["University of Waterloo,Waterloo,Canada","University of Waterloo, Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo,Waterloo,Canada","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100651885"],"corresponding_institution_ids":["https://openalex.org/I150229711","https://openalex.org/I3018263800"],"apc_list":null,"apc_paid":null,"fwci":2.2059,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.88818171,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12042","display_name":"Satellite Communication Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12042","display_name":"Satellite Communication Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7720857858657837},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7629506587982178},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.6147967576980591},{"id":"https://openalex.org/keywords/satellite","display_name":"Satellite","score":0.5968995094299316},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5642776489257812},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5450986623764038},{"id":"https://openalex.org/keywords/resource-management","display_name":"Resource management (computing)","score":0.5248189568519592},{"id":"https://openalex.org/keywords/handover","display_name":"Handover","score":0.495140939950943},{"id":"https://openalex.org/keywords/user-equipment","display_name":"User equipment","score":0.48767364025115967},{"id":"https://openalex.org/keywords/low-earth-orbit","display_name":"Low earth orbit","score":0.44398626685142517},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.43946802616119385},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.43915677070617676},{"id":"https://openalex.org/keywords/communications-satellite","display_name":"Communications satellite","score":0.43085721135139465},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.4249940514564514},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.37756913900375366},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.3585493564605713},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.26709461212158203},{"id":"https://openalex.org/keywords/base-station","display_name":"Base station","score":0.23268896341323853},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16485637426376343},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.16178670525550842},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12965551018714905}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7720857858657837},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7629506587982178},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.6147967576980591},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.5968995094299316},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5642776489257812},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5450986623764038},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.5248189568519592},{"id":"https://openalex.org/C111852164","wikidata":"https://www.wikidata.org/wiki/Q1414679","display_name":"Handover","level":2,"score":0.495140939950943},{"id":"https://openalex.org/C2781327853","wikidata":"https://www.wikidata.org/wiki/Q3552547","display_name":"User equipment","level":3,"score":0.48767364025115967},{"id":"https://openalex.org/C3018325918","wikidata":"https://www.wikidata.org/wiki/Q663611","display_name":"Low earth orbit","level":3,"score":0.44398626685142517},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.43946802616119385},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.43915677070617676},{"id":"https://openalex.org/C121308736","wikidata":"https://www.wikidata.org/wiki/Q149918","display_name":"Communications satellite","level":3,"score":0.43085721135139465},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4249940514564514},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.37756913900375366},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.3585493564605713},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.26709461212158203},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.23268896341323853},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16485637426376343},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.16178670525550842},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12965551018714905},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/pimrc56721.2023.10294047","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pimrc56721.2023.10294047","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 34th Annual International Symposium on Personal, Indoor and Mobile Radio Communications (PIMRC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1771410628","https://openalex.org/W2486822254","https://openalex.org/W2941952695","https://openalex.org/W3081405700","https://openalex.org/W3119186746","https://openalex.org/W3197055488","https://openalex.org/W3214579853","https://openalex.org/W3216670142","https://openalex.org/W4200232410","https://openalex.org/W4280626288","https://openalex.org/W6638018090","https://openalex.org/W6804378595"],"related_works":["https://openalex.org/W2907119020","https://openalex.org/W2809714975","https://openalex.org/W2045260746","https://openalex.org/W4310173015","https://openalex.org/W2071030690","https://openalex.org/W1575175994","https://openalex.org/W2103870217","https://openalex.org/W2284276991","https://openalex.org/W2137666192","https://openalex.org/W1939450696"],"abstract_inverted_index":{"Non-terrestrial":[0],"networks":[1],"(NTNs)":[2],"with":[3,94,129,166],"low-earth":[4],"orbit":[5],"(LEO)":[6],"satellites":[7],"have":[8,45],"been":[9,46],"regarded":[10],"as":[11],"promising":[12],"remedies":[13],"to":[14,21,66,147],"support":[15],"global":[16],"ubiquitous":[17],"wireless":[18],"services.":[19],"Due":[20],"the":[22,51,72,79,91,149,154,157,173,179,185],"rapid":[23],"mobility":[24],"of":[25,152],"LEO":[26,52,80,92,125,158],"satellite,":[27],"inter-beam/satellite":[28],"handovers":[29],"happen":[30],"frequently":[31],"for":[32,71,115],"a":[33,59,107,138,167],"specific":[34],"user":[35],"equipment":[36],"(UE).":[37],"To":[38,98],"tackle":[39],"this":[40,100,103],"issue,":[41,101],"earth-fixed":[42],"cell":[43],"scenarios":[44],"under":[47],"studied,":[48],"in":[49,102,121,123],"which":[50,86,124],"satellite":[53,81,93,126,159],"adjusts":[54],"its":[55,63,144],"beam":[56,116],"direction":[57],"towards":[58],"fixed":[60],"area":[61],"within":[62],"dwell":[64],"duration,":[65],"maintain":[67],"stable":[68],"transmission":[69],"performance":[70,187],"UE.":[73,174],"Therefore,":[74],"it":[75],"is":[76,88],"required":[77],"that":[78,178],"performs":[82],"real-time":[83],"resource":[84,119],"allocation,":[85],"however":[87],"unaffordable":[89],"by":[90],"limited":[95],"computing":[96],"capability.":[97],"address":[99],"paper,":[104],"we":[105],"propose":[106],"two-time-scale":[108],"collaborative":[109],"deep":[110],"reinforcement":[111],"learning":[112],"(DRL)":[113],"scheme":[114,181],"management":[117],"and":[118,127,188],"allocation":[120],"NTNs,":[122],"UE":[128,142],"different":[130],"control":[131],"cycles":[132],"update":[133],"their":[134],"decision-making":[135],"policies":[136],"through":[137,163],"sequential":[139],"manner.":[140],"Specifically,":[141],"updates":[143],"policy":[145],"subject":[146],"improving":[148],"value":[150],"functions":[151],"both":[153],"agents.":[155],"Furthermore,":[156],"only":[160],"makes":[161],"decisions":[162],"finite-step":[164],"rollouts":[165],"reference":[168],"decision":[169],"trajectory":[170],"received":[171],"from":[172],"Simulation":[175],"results":[176],"show":[177],"proposed":[180],"can":[182],"effectively":[183],"balance":[184],"throughput":[186],"computational":[189],"complexity":[190],"over":[191],"traditional":[192],"greedy-searching":[193],"schemes.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
