{"id":"https://openalex.org/W4285185484","doi":"https://doi.org/10.1587/transcom.2021tmp0011","title":"Reinforcement Learning for QoS-Constrained Autonomous Resource Allocation with H2H/M2M Co-Existence in Cellular Networks","display_name":"Reinforcement Learning for QoS-Constrained Autonomous Resource Allocation with H2H/M2M Co-Existence in Cellular Networks","publication_year":2022,"publication_date":"2022-05-26","ids":{"openalex":"https://openalex.org/W4285185484","doi":"https://doi.org/10.1587/transcom.2021tmp0011"},"language":"en","primary_location":{"id":"doi:10.1587/transcom.2021tmp0011","is_oa":false,"landing_page_url":"https://doi.org/10.1587/transcom.2021tmp0011","pdf_url":null,"source":{"id":"https://openalex.org/S2493627025","display_name":"IEICE Transactions on Communications","issn_l":"0916-8516","issn":["0916-8516","1745-1345"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Communications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001554743","display_name":"Xing Wei","orcid":"https://orcid.org/0000-0001-7220-6671"},"institutions":[{"id":"https://openalex.org/I78675632","display_name":"Beijing Information Science & Technology University","ror":"https://ror.org/04xnqep60","country_code":"CN","type":"education","lineage":["https://openalex.org/I78675632"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xing WEI","raw_affiliation_strings":["Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University","institution_ids":["https://openalex.org/I78675632"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083258189","display_name":"Xuehua Li","orcid":"https://orcid.org/0000-0002-7788-8656"},"institutions":[{"id":"https://openalex.org/I78675632","display_name":"Beijing Information Science & Technology University","ror":"https://ror.org/04xnqep60","country_code":"CN","type":"education","lineage":["https://openalex.org/I78675632"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuehua LI","raw_affiliation_strings":["Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University","institution_ids":["https://openalex.org/I78675632"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056328756","display_name":"Shuo CHEN","orcid":null},"institutions":[{"id":"https://openalex.org/I78675632","display_name":"Beijing Information Science & Technology University","ror":"https://ror.org/04xnqep60","country_code":"CN","type":"education","lineage":["https://openalex.org/I78675632"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuo CHEN","raw_affiliation_strings":["Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Modern Measurement and Control Technology, Ministry of Education, Beijing Information Science and Technology University","institution_ids":["https://openalex.org/I78675632"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100368105","display_name":"Na Li","orcid":"https://orcid.org/0000-0002-3801-274X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Na LI","raw_affiliation_strings":["Baicells Technologies, Co., Ltd"],"affiliations":[{"raw_affiliation_string":"Baicells Technologies, Co., Ltd","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5001554743"],"corresponding_institution_ids":["https://openalex.org/I78675632"],"apc_list":null,"apc_paid":null,"fwci":0.0915,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.39018616,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"E105.B","issue":"11","first_page":"1332","last_page":"1341"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12079","display_name":"IoT Networks and Protocols","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11158","display_name":"Wireless Networks and Protocols","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9040989875793457},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8558118343353271},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.6145092248916626},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.5219345092773438},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.5151602029800415},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.44587305188179016},{"id":"https://openalex.org/keywords/cellular-network","display_name":"Cellular network","score":0.43189913034439087},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2470930516719818}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9040989875793457},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8558118343353271},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.6145092248916626},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.5219345092773438},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.5151602029800415},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.44587305188179016},{"id":"https://openalex.org/C153646914","wikidata":"https://www.wikidata.org/wiki/Q535695","display_name":"Cellular network","level":2,"score":0.43189913034439087},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2470930516719818}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transcom.2021tmp0011","is_oa":false,"landing_page_url":"https://doi.org/10.1587/transcom.2021tmp0011","pdf_url":null,"source":{"id":"https://openalex.org/S2493627025","display_name":"IEICE Transactions on Communications","issn_l":"0916-8516","issn":["0916-8516","1745-1345"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Communications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1557517019","https://openalex.org/W1604601165","https://openalex.org/W1970758260","https://openalex.org/W2010876592","https://openalex.org/W2027991989","https://openalex.org/W2042768148","https://openalex.org/W2074192694","https://openalex.org/W2093917343","https://openalex.org/W2103972037","https://openalex.org/W2106530632","https://openalex.org/W2110767187","https://openalex.org/W2118318536","https://openalex.org/W2136423702","https://openalex.org/W2141411458","https://openalex.org/W2155459071","https://openalex.org/W2202997502","https://openalex.org/W2289936855","https://openalex.org/W2474986724","https://openalex.org/W2490143110","https://openalex.org/W2755237848","https://openalex.org/W2799944166","https://openalex.org/W2898648417","https://openalex.org/W2945781536","https://openalex.org/W3049089382","https://openalex.org/W3146439482","https://openalex.org/W3153670168"],"related_works":["https://openalex.org/W2130966263","https://openalex.org/W1504006543","https://openalex.org/W3089192431","https://openalex.org/W1576039592","https://openalex.org/W2027336428","https://openalex.org/W4289712363","https://openalex.org/W3212159549","https://openalex.org/W2158265795","https://openalex.org/W1997415650","https://openalex.org/W4301230706"],"abstract_inverted_index":{"Machine-to-Machine":[0],"(M2M)":[1],"communication":[2],"plays":[3],"a":[4,21,43,70,114,120],"pivotal":[5],"role":[6],"in":[7,78,193,205],"the":[8,96,130,149,159,164,174,195],"evolution":[9],"of":[10,12,38,45,102,108,111,177,197,207],"Internet":[11],"Things":[13],"(IoT).":[14],"Cellular":[15],"networks":[16],"are":[17,28,86],"considered":[18],"to":[19,47,62,157,167],"be":[20],"key":[22],"enabler":[23],"for":[24,32,132],"M2M":[25,39,84,169],"communications,":[26],"which":[27,128,147],"originally":[29],"designed":[30],"mainly":[31],"Human-to-Human":[33],"(H2H)":[34],"communications.":[35],"The":[36],"introduction":[37],"users":[40,85,201],"will":[41],"cause":[42],"series":[44],"problems":[46],"traditional":[48],"H2H":[49],"users,":[50],"i.e.,":[51],"interference":[52],"between":[53],"various":[54],"traffic.":[55,112],"Resource":[56],"allocation":[57,77,98,144],"is":[58,117,123],"an":[59,79,185],"effective":[60],"solution":[61],"these":[63],"problems.":[64],"In":[65],"this":[66],"paper,":[67],"we":[68,137],"consider":[69],"shared":[71],"resource":[72],"block":[73],"(RB)":[74],"and":[75,90,162,210],"power":[76],"H2H/M2M":[80],"coexistence":[81],"scenario,":[82],"where":[83],"subdivided":[87],"into":[88],"delay-tolerant":[89,198],"delay-sensitive":[91],"types.":[92],"We":[93],"first":[94],"model":[95],"RB-power":[97,143,165],"problem":[99],"as":[100,155],"maximization":[101],"capacity":[103,171],"under":[104],"Quality-of-Service":[105],"(QoS)":[106],"constraints":[107],"different":[109],"types":[110],"Then,":[113],"learning":[115],"framework":[116],"introduced,":[118],"wherein":[119],"complex":[121],"agent":[122],"built":[124],"from":[125],"simpler":[126],"subagents,":[127],"provides":[129],"basis":[131],"distributed":[133,139],"deployment":[134],"scheme.":[135],"Further,":[136],"proposed":[138,190],"Q-learning":[140],"based":[141],"autonomous":[142],"algorithm":[145],"(DQ-ARPA),":[146],"enables":[148],"machine":[150,199],"type":[151,200],"network":[152],"gateways":[153],"(MTCG)":[154],"agents":[156],"learn":[158],"wireless":[160],"environment":[161],"choose":[163],"autonomously":[166],"maximize":[168],"pairs'":[170],"while":[172],"ensuring":[173],"QoS":[175],"requirements":[176],"critical":[178,203],"services.":[179],"Simulation":[180],"results":[181],"indicates":[182],"that":[183],"with":[184],"appropriate":[186],"reward":[187],"design,":[188],"our":[189],"scheme":[191],"succeeds":[192],"reducing":[194],"impact":[196],"on":[202],"services":[204],"terms":[206],"SINR":[208],"thresholds":[209],"outage":[211],"ratios.":[212]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
