{"id":"https://openalex.org/W2919800250","doi":"https://doi.org/10.1109/tencon.2018.8650160","title":"An Actor-Critic Reinforcement Learning for Device-to-Device Communication Underlaying Cellular Network","display_name":"An Actor-Critic Reinforcement Learning for Device-to-Device Communication Underlaying Cellular Network","publication_year":2018,"publication_date":"2018-10-01","ids":{"openalex":"https://openalex.org/W2919800250","doi":"https://doi.org/10.1109/tencon.2018.8650160","mag":"2919800250"},"language":"en","primary_location":{"id":"doi:10.1109/tencon.2018.8650160","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tencon.2018.8650160","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"TENCON 2018 - 2018 IEEE Region 10 Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025675268","display_name":"Pratap Khuntia","orcid":"https://orcid.org/0000-0003-1373-9907"},"institutions":[{"id":"https://openalex.org/I151903974","display_name":"National Institute Of Technology Silchar","ror":"https://ror.org/001ws2a36","country_code":"IN","type":"education","lineage":["https://openalex.org/I151903974"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Pratap Khuntia","raw_affiliation_strings":["Department of Electronics and Instrumentation Engineering, National Institute of Technology, Silchar, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Instrumentation Engineering, National Institute of Technology, Silchar, India","institution_ids":["https://openalex.org/I151903974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002872086","display_name":"Ranjay Hazra","orcid":"https://orcid.org/0000-0002-3912-951X"},"institutions":[{"id":"https://openalex.org/I151903974","display_name":"National Institute Of Technology Silchar","ror":"https://ror.org/001ws2a36","country_code":"IN","type":"education","lineage":["https://openalex.org/I151903974"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ranjay Hazra","raw_affiliation_strings":["Department of Electronics and Instrumentation Engineering, National Institute of Technology, Silchar, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Instrumentation Engineering, National Institute of Technology, Silchar, India","institution_ids":["https://openalex.org/I151903974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5025675268"],"corresponding_institution_ids":["https://openalex.org/I151903974"],"apc_list":null,"apc_paid":null,"fwci":0.6438,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.72312927,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"0050","last_page":"0055"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9527000188827515,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9135949611663818},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.773979663848877},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.7523316740989685},{"id":"https://openalex.org/keywords/cellular-network","display_name":"Cellular network","score":0.6669901013374329},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5590953826904297},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.43285852670669556},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.43250036239624023},{"id":"https://openalex.org/keywords/shared-resource","display_name":"Shared resource","score":0.4265096187591553},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.42004984617233276},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.4121442437171936},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.31975916028022766},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26199662685394287},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.155915766954422}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9135949611663818},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.773979663848877},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.7523316740989685},{"id":"https://openalex.org/C153646914","wikidata":"https://www.wikidata.org/wiki/Q535695","display_name":"Cellular network","level":2,"score":0.6669901013374329},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5590953826904297},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.43285852670669556},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.43250036239624023},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.4265096187591553},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.42004984617233276},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.4121442437171936},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.31975916028022766},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26199662685394287},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.155915766954422},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tencon.2018.8650160","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tencon.2018.8650160","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"TENCON 2018 - 2018 IEEE Region 10 Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.47999998927116394}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W846918069","https://openalex.org/W1497356564","https://openalex.org/W1509036040","https://openalex.org/W1966086707","https://openalex.org/W1974147084","https://openalex.org/W1983523797","https://openalex.org/W2009303086","https://openalex.org/W2031260290","https://openalex.org/W2091565802","https://openalex.org/W2117537207","https://openalex.org/W2149016651","https://openalex.org/W6682025889"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W2029232111","https://openalex.org/W2159422359","https://openalex.org/W2335680976","https://openalex.org/W2294196761","https://openalex.org/W2141929741","https://openalex.org/W2252345849","https://openalex.org/W2786117496","https://openalex.org/W1487555369"],"abstract_inverted_index":{"Device-to-device":[0],"(D2D)":[1],"communication":[2,28],"is":[3,60,69,105,185],"one":[4],"of":[5,26,35,155,167,176,191],"the":[6,11,50,58,73,78,118,124,140,143,147,156,164,173,182,188],"new":[7],"emerging":[8],"technologies":[9],"for":[10,135,149,181],"future":[12],"cellular":[13,39],"networks":[14],"that":[15],"allows":[16],"terminals":[17],"in":[18,30,62,123],"close":[19],"proximity":[20],"to":[21,71,92],"communicate":[22],"directly.":[23],"The":[24,46,127],"advantage":[25],"D2D":[27,43,99],"lies":[29],"using":[31],"an":[32,85],"efficient":[33],"method":[34,104],"resource":[36],"sharing":[37],"between":[38],"users":[40,44],"(CUs)":[41],"and":[42,49,145,171],"(D2Ds).":[45],"wireless":[47],"channel":[48],"received":[51],"reward":[52],"at":[53],"each":[54],"state":[55],"associated":[56],"with":[57,77,187],"system":[59,94,184],"stochastic":[61,133],"nature,":[63],"so":[64],"reinforcement":[65],"learning":[66,114,169],"(RL)":[67],"technique":[68],"used":[70],"learn":[72],"policy":[74,90,102,125,134,144,157],"through":[75],"interaction":[76],"environment.":[79],"In":[80],"this":[81],"paper,":[82],"we":[83,162],"follow":[84],"actor-critic":[86],"RL":[87],"based":[88,103,109,132],"on":[89],"gradient":[91],"improve":[93],"throughput":[95,120,174],"as":[96,98,112,178,180],"well":[97,179],"throughput.":[100],"This":[101,151],"preferable":[106],"than":[107],"value":[108],"scheme":[110],"such":[111,168],"Q":[113],"because":[115],"it":[116],"maximizes":[117],"expected":[119],"by":[121],"searching":[122],"space.":[126],"actor":[128,148],"follows":[129],"a":[130],"parameter":[131],"giving":[136],"continuous":[137],"actions":[138],"while":[139],"critic":[141],"estimates":[142],"criticizes":[146],"action.":[150],"reduces":[152],"high":[153],"variance":[154],"gradient.":[158],"Through":[159],"numerical":[160],"simulations,":[161],"confirm":[163],"convergence":[165],"property":[166],"process":[170],"finally":[172],"performance":[175],"D2Ds":[177],"whole":[183],"compared":[186],"traditional":[189],"schemes":[190],"LTE":[192],"(Long":[193],"Term":[194],"Evolution)":[195],"network.":[196]},"counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
