{"id":"https://openalex.org/W2563286983","doi":"https://doi.org/10.1109/pimrc.2016.7794793","title":"Q-learning based power control algorithm for D2D communication","display_name":"Q-learning based power control algorithm for D2D communication","publication_year":2016,"publication_date":"2016-09-01","ids":{"openalex":"https://openalex.org/W2563286983","doi":"https://doi.org/10.1109/pimrc.2016.7794793","mag":"2563286983"},"language":"en","primary_location":{"id":"doi:10.1109/pimrc.2016.7794793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pimrc.2016.7794793","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE 27th Annual International Symposium on Personal, Indoor, and Mobile Radio Communications (PIMRC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100904293","display_name":"Shiwen Nie","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shiwen Nie","raw_affiliation_strings":["Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114949443","display_name":"Zhi\u2010Qiang Fan","orcid":"https://orcid.org/0000-0002-8881-8354"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Fan","raw_affiliation_strings":["Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103197618","display_name":"Ming Zhao","orcid":"https://orcid.org/0000-0003-4126-3678"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Zhao","raw_affiliation_strings":["Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018769767","display_name":"Xinyu Gu","orcid":"https://orcid.org/0000-0001-6762-7463"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyu Gu","raw_affiliation_strings":["Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100351907","display_name":"Lin Zhang","orcid":"https://orcid.org/0000-0003-0424-9965"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Zhang","raw_affiliation_strings":["Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Lab of Universal Wireless Communication, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100904293"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":3.5467,"has_fulltext":false,"cited_by_count":63,"citation_normalized_percentile":{"value":0.93314738,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"2016","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10796","display_name":"Cooperative Communication and Network Coding","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8306801319122314},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7565042972564697},{"id":"https://openalex.org/keywords/underlay","display_name":"Underlay","score":0.7476197481155396},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.6282773017883301},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6068832278251648},{"id":"https://openalex.org/keywords/power-control","display_name":"Power control","score":0.602448582649231},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.5984650254249573},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5300607085227966},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.5122458338737488},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.5099912881851196},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5021224021911621},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3698357045650482},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29293355345726013},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.26701658964157104},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.14298972487449646},{"id":"https://openalex.org/keywords/signal-to-noise-ratio","display_name":"Signal-to-noise ratio (imaging)","score":0.08901563286781311},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.0694575309753418}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8306801319122314},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7565042972564697},{"id":"https://openalex.org/C2777679929","wikidata":"https://www.wikidata.org/wiki/Q7883709","display_name":"Underlay","level":3,"score":0.7476197481155396},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.6282773017883301},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6068832278251648},{"id":"https://openalex.org/C56685638","wikidata":"https://www.wikidata.org/wiki/Q2300474","display_name":"Power control","level":3,"score":0.602448582649231},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.5984650254249573},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5300607085227966},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.5122458338737488},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.5099912881851196},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5021224021911621},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3698357045650482},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29293355345726013},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.26701658964157104},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14298972487449646},{"id":"https://openalex.org/C13944312","wikidata":"https://www.wikidata.org/wiki/Q7512748","display_name":"Signal-to-noise ratio (imaging)","level":2,"score":0.08901563286781311},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.0694575309753418},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/pimrc.2016.7794793","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pimrc.2016.7794793","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE 27th Annual International Symposium on Personal, Indoor, and Mobile Radio Communications (PIMRC)","raw_type":"proceedings-article"},{"id":"mag:2744688778","is_oa":false,"landing_page_url":"http://jglobal.jst.go.jp/en/public/20090422/201702286440777327","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1560074431","https://openalex.org/W1969281101","https://openalex.org/W1973039793","https://openalex.org/W1974147084","https://openalex.org/W1975186862","https://openalex.org/W2003137900","https://openalex.org/W2023472100","https://openalex.org/W2033775444","https://openalex.org/W2044576662","https://openalex.org/W2049493752","https://openalex.org/W2073405766","https://openalex.org/W2099618002","https://openalex.org/W2101786389","https://openalex.org/W2104137227","https://openalex.org/W2117537207","https://openalex.org/W2140656373","https://openalex.org/W2149016651","https://openalex.org/W2177686513","https://openalex.org/W2964064418","https://openalex.org/W6633472260","https://openalex.org/W6682025889"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2166117066","https://openalex.org/W2131684146","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W3087814763","https://openalex.org/W2570831710","https://openalex.org/W4386391606","https://openalex.org/W2034845478","https://openalex.org/W2361647908"],"abstract_inverted_index":{"In":[0,113],"this":[1],"paper,":[2],"reinforcement":[3],"learning":[4,60],"(RL)":[5],"based":[6,51],"power":[7,28,52,132],"control":[8,29,53],"algorithm":[9,105],"in":[10,70,106,133,148],"underlay":[11],"D2D":[12,21,56,84,123],"communication":[13,22],"is":[14,30,66,116],"studied.":[15],"The":[16,64],"approach":[17],"we":[18],"use":[19],"regards":[20],"as":[23],"a":[24,67,134],"multi-agents":[25],"system,":[26],"and":[27,61,89,110],"achieved":[31],"by":[32],"maximizing":[33],"system":[34,141],"capacity":[35],"while":[36,80],"maintaining":[37],"the":[38,81,91,99,102],"requirement":[39],"of":[40,42,93,101,108],"quality":[41],"service(QoS)":[43],"from":[44],"cellular":[45],"users.":[46],"We":[47],"propose":[48],"two":[49,103],"RL":[50],"methods":[54],"for":[55],"users,":[57],"i.e.,":[58],"team-Q":[59],"distributed-Q":[62,121],"learning.":[63],"former":[65],"centralized":[68],"method":[69,147],"which":[71],"only":[72,126],"one":[73],"Q-value":[74,94],"table":[75],"needs":[76],"to":[77,86,129],"be":[78],"maintained,":[79],"latter":[82],"enables":[83],"users":[85,124],"learn":[87,130],"independently":[88],"reduces":[90],"complexity":[92],"table.":[95],"Simulation":[96],"results":[97],"show":[98],"difference":[100],"Q-learning":[104],"terms":[107],"convergence":[109],"reward":[111],"function.":[112],"addition,":[114],"it":[115],"shown":[117],"that":[118,144],"through":[119],"our":[120],"learning,":[122],"not":[125],"are":[127],"able":[128],"their":[131],"self-organized":[135],"way,":[136],"but":[137],"also":[138],"achieve":[139],"better":[140],"performance":[142],"than":[143],"using":[145],"traditional":[146],"LTE(Long":[149],"Term":[150],"Evolution).":[151]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":15},{"year":2020,"cited_by_count":17},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
