{"id":"https://openalex.org/W7117461884","doi":"https://doi.org/10.1007/s44227-025-00081-0","title":"2DRL: Cognitive D2D Control Under Imperfect CSI Via Adaptive Deep Reinforcement Learning","display_name":"2DRL: Cognitive D2D Control Under Imperfect CSI Via Adaptive Deep Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-29","ids":{"openalex":"https://openalex.org/W7117461884","doi":"https://doi.org/10.1007/s44227-025-00081-0"},"language":"en","primary_location":{"id":"doi:10.1007/s44227-025-00081-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44227-025-00081-0","pdf_url":null,"source":{"id":"https://openalex.org/S2764679164","display_name":"\u0098The \u009cInternational journal of networked and distributed computing","issn_l":"2211-7938","issn":["2211-7938","2211-7946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Networked and Distributed Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1007/s44227-025-00081-0","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037876961","display_name":"Panduranga Ravi Teja","orcid":"https://orcid.org/0009-0003-8084-5926"},"institutions":[{"id":"https://openalex.org/I5847235","display_name":"University of Petroleum and Energy Studies","ror":"https://ror.org/04q2jes40","country_code":"IN","type":"education","lineage":["https://openalex.org/I5847235"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Panduranga Ravi Teja","raw_affiliation_strings":["School of Computer Science, UPES, Dehradun, Uttarakhand, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science, UPES, Dehradun, Uttarakhand, India","institution_ids":["https://openalex.org/I5847235"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121509471","display_name":"Krati Dubey","orcid":null},"institutions":[{"id":"https://openalex.org/I73779912","display_name":"Manipal University Jaipur","ror":"https://ror.org/040h76494","country_code":null,"type":"education","lineage":["https://openalex.org/I73779912"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Krati Dubey","raw_affiliation_strings":["Department of IT, Manipal University Jaipur, Jaipur, Rajasthan, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of IT, Manipal University Jaipur, Jaipur, Rajasthan, India","institution_ids":["https://openalex.org/I73779912"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031674330","display_name":"Rishav Dubey","orcid":"https://orcid.org/0000-0001-8324-3152"},"institutions":[{"id":"https://openalex.org/I73779912","display_name":"Manipal University Jaipur","ror":"https://ror.org/040h76494","country_code":null,"type":"education","lineage":["https://openalex.org/I73779912"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rishav Dubey","raw_affiliation_strings":["Department of CSE, Manipal University Jaipur, Jaipur, Rajasthan, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of CSE, Manipal University Jaipur, Jaipur, Rajasthan, India","institution_ids":["https://openalex.org/I73779912"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037876961"],"corresponding_institution_ids":["https://openalex.org/I5847235"],"apc_list":{"value":350,"currency":"EUR","value_usd":377},"apc_paid":{"value":350,"currency":"EUR","value_usd":377},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.5550335,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.5091000199317932,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.5091000199317932,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11392","display_name":"Energy Harvesting in Wireless Networks","score":0.09239999949932098,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10579","display_name":"Cognitive Radio Networks and Spectrum Sensing","score":0.06549999862909317,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8693000078201294},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.5189999938011169},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4650999903678894},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.4546000063419342},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.43320000171661377},{"id":"https://openalex.org/keywords/mode","display_name":"Mode (computer interface)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4311999976634979},{"id":"https://openalex.org/keywords/resource-management","display_name":"Resource management (computing)","score":0.4178999960422516},{"id":"https://openalex.org/keywords/interference","display_name":"Interference (communication)","score":0.3978999853134155}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8693000078201294},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8216999769210815},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.5189999938011169},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4650999903678894},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.4546000063419342},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.43320000171661377},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4311999976634979},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.4178999960422516},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.3978999853134155},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.39239999651908875},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.38920000195503235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3874000012874603},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.37860000133514404},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.3765000104904175},{"id":"https://openalex.org/C148063708","wikidata":"https://www.wikidata.org/wiki/Q5072511","display_name":"Channel state information","level":3,"score":0.34599998593330383},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.33169999718666077},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.32989999651908875},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.32919999957084656},{"id":"https://openalex.org/C137246740","wikidata":"https://www.wikidata.org/wiki/Q583970","display_name":"Spectral efficiency","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C24590314","wikidata":"https://www.wikidata.org/wiki/Q336038","display_name":"Wireless sensor network","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s44227-025-00081-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44227-025-00081-0","pdf_url":null,"source":{"id":"https://openalex.org/S2764679164","display_name":"\u0098The \u009cInternational journal of networked and distributed computing","issn_l":"2211-7938","issn":["2211-7938","2211-7946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Networked and Distributed Computing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s44227-025-00081-0","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s44227-025-00081-0","pdf_url":null,"source":{"id":"https://openalex.org/S2764679164","display_name":"\u0098The \u009cInternational journal of networked and distributed computing","issn_l":"2211-7938","issn":["2211-7938","2211-7946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Networked and Distributed Computing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.5096006393432617}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2113271807","https://openalex.org/W2116334496","https://openalex.org/W2147584524","https://openalex.org/W2559695533","https://openalex.org/W2962846391","https://openalex.org/W2966577281","https://openalex.org/W3006127356","https://openalex.org/W3010337308","https://openalex.org/W3012365346","https://openalex.org/W3035433001","https://openalex.org/W3126850651","https://openalex.org/W4206500022","https://openalex.org/W4311628284","https://openalex.org/W4315571337","https://openalex.org/W4367050936","https://openalex.org/W4377079791","https://openalex.org/W4384158934","https://openalex.org/W4385065319","https://openalex.org/W4400084211","https://openalex.org/W4400179263","https://openalex.org/W4400844178","https://openalex.org/W4405317411","https://openalex.org/W4405677417"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3],"novel":[4],"Dynamic":[5],"Deep":[6],"Reinforcement":[7],"Learning":[8],"(2DRL)":[9],"framework":[10,156],"that":[11,91],"addresses":[12],"the":[13,40,158],"critical":[14],"challenges":[15],"of":[16],"resource":[17,73],"allocation":[18],"and":[19,54,75,106,121,143,150,170],"mode":[20,79],"switching":[21],"in":[22],"Device-to-Device":[23],"(D2D)":[24],"networks":[25],"operating":[26],"under":[27,103],"imperfect":[28],"Channel":[29],"State":[30],"Information":[31],"(CSI).":[32],"Unlike":[33],"traditional":[34],"static":[35],"schemes":[36],"such":[37,131],"as":[38,132],"ARAMS,":[39],"proposed":[41,155],"2DRL":[42,92],"dynamically":[43],"learns":[44],"optimal":[45],"policies":[46],"through":[47],"real-time":[48],"interaction":[49],"with":[50],"rapidly":[51],"changing":[52],"channel":[53],"interference":[55],"conditions.":[56],"Our":[57],"design":[58],"integrates":[59],"advanced":[60],"neural":[61],"modules\u2014Conv2D":[62],"for":[63,67,72,78,140,147,160],"spatial":[64],"interference,":[65],"LSTM":[66],"mobility":[68],"awareness,":[69],"Sinkhorn":[70],"layers":[71],"allocation,":[74],"Gumbel-Softmax":[76],"sampling":[77],"control\u2014all":[80],"constrained":[81],"by":[82,110],"practical":[83],"5":[84],"G":[85,152],"NR":[86],"requirements.":[87],"Simulation":[88],"results":[89],"demonstrate":[90],"achieves":[93],"up":[94],"to":[95,113,165],"22%":[96],"higher":[97],"throughput,":[98],"maintains":[99],"85%":[100],"performance":[101],"retention":[102],"joint":[104],"stressors,":[105],"reduces":[107],"constraint":[108],"violations":[109],"6.8\u00d7":[111],"compared":[112],"baselines.":[114],"By":[115],"significantly":[116],"improving":[117],"spectral":[118],"efficiency,":[119],"fairness,":[120],"energy":[122],"usage,":[123],"this":[124],"work":[125],"directly":[126],"supports":[127],"socially":[128],"relevant":[129],"goals":[130],"reliable":[133],"ultra-dense":[134],"urban":[135],"connectivity,":[136],"smarter":[137],"spectrum":[138],"usage":[139],"next-generation":[141],"IoT,":[142],"sustainable":[144],"network":[145],"operation":[146],"smart":[148],"cities":[149],"6":[151],"ecosystems.":[153],"The":[154],"lays":[157],"groundwork":[159],"future":[161],"multi-agent":[162],"reinforcement":[163],"learning":[164],"further":[166],"enhance":[167],"scalable,":[168],"low-latency,":[169],"resilient":[171],"wireless":[172],"infrastructures.":[173]},"counts_by_year":[],"updated_date":"2026-04-30T09:15:22.047038","created_date":"2025-12-29T00:00:00"}
