{"id":"https://openalex.org/W7153307465","doi":"https://doi.org/10.48550/arxiv.2604.07411","title":"Reinforcement Learning with Reward Machines for Sleep Control in Mobile Networks","display_name":"Reinforcement Learning with Reward Machines for Sleep Control in Mobile Networks","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7153307465","doi":"https://doi.org/10.48550/arxiv.2604.07411"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07411","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07411","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07411","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133372781","display_name":"Kristina Levina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levina, Kristina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133386044","display_name":"Nikolaos Pappas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pappas, Nikolaos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019423716","display_name":"Athanasios Karapantelakis","orcid":"https://orcid.org/0000-0001-6899-4134"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karapantelakis, Athanasios","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071477155","display_name":"Aneta Vulgarakis Feljan","orcid":"https://orcid.org/0009-0001-1950-7739"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feljan, Aneta Vulgarakis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133385232","display_name":"Jendrik Seipp","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seipp, Jendrik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12238","display_name":"Green IT and Sustainability","score":0.6953999996185303,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12238","display_name":"Green IT and Sustainability","score":0.6953999996185303,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10148","display_name":"Advanced MIMO Systems Optimization","score":0.041099999099969864,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10138","display_name":"Network Traffic and Congestion Control","score":0.04010000079870224,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6930000185966492},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.6567999720573425},{"id":"https://openalex.org/keywords/network-packet","display_name":"Network packet","score":0.4595000147819519},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4564000070095062},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.44940000772476196},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4462999999523163},{"id":"https://openalex.org/keywords/sleep-mode","display_name":"Sleep mode","score":0.41990000009536743},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.40720000863075256},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.37779998779296875},{"id":"https://openalex.org/keywords/mobile-computing","display_name":"Mobile computing","score":0.3538999855518341}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7373999953269958},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6930000185966492},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.6567999720573425},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.4595000147819519},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4564000070095062},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.44940000772476196},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C57149124","wikidata":"https://www.wikidata.org/wiki/Q587346","display_name":"Sleep mode","level":4,"score":0.41990000009536743},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.40720000863075256},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3901999890804291},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.37700000405311584},{"id":"https://openalex.org/C144543869","wikidata":"https://www.wikidata.org/wiki/Q2738570","display_name":"Mobile computing","level":2,"score":0.3538999855518341},{"id":"https://openalex.org/C2775841894","wikidata":"https://www.wikidata.org/wiki/Q4683692","display_name":"Sleep (system call)","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.33059999346733093},{"id":"https://openalex.org/C91280400","wikidata":"https://www.wikidata.org/wiki/Q4085781","display_name":"Mobile ad hoc network","level":3,"score":0.32899999618530273},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3237999975681305},{"id":"https://openalex.org/C95491727","wikidata":"https://www.wikidata.org/wiki/Q992968","display_name":"Mobile telephony","level":3,"score":0.31709998846054077},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3133000135421753},{"id":"https://openalex.org/C54108766","wikidata":"https://www.wikidata.org/wiki/Q391064","display_name":"Packet loss","level":3,"score":0.3052000105381012},{"id":"https://openalex.org/C153646914","wikidata":"https://www.wikidata.org/wiki/Q535695","display_name":"Cellular network","level":2,"score":0.3019999861717224},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C56685638","wikidata":"https://www.wikidata.org/wiki/Q2300474","display_name":"Power control","level":3,"score":0.2816999852657318},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.27950000762939453},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2754000127315521},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C7817414","wikidata":"https://www.wikidata.org/wiki/Q1779504","display_name":"Energy management","level":3,"score":0.2709999978542328},{"id":"https://openalex.org/C129763632","wikidata":"https://www.wikidata.org/wiki/Q1454667","display_name":"Network management","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C24590314","wikidata":"https://www.wikidata.org/wiki/Q336038","display_name":"Wireless sensor network","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.25440001487731934},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C186967261","wikidata":"https://www.wikidata.org/wiki/Q5082128","display_name":"Mobile device","level":2,"score":0.25}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07411","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07411","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07411","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07411","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.4885106384754181}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Energy":[0],"efficiency":[1],"in":[2,25],"mobile":[3,26,164],"networks":[4,27,165],"is":[5,97,117],"crucial":[6],"for":[7,22,42,85,92,134,162],"sustainable":[8],"telecommunications":[9],"infrastructure,":[10],"particularly":[11],"as":[12],"network":[13],"densification":[14],"continues":[15],"to":[16,36,38,67,159],"increase":[17],"power":[18],"consumption.":[19],"Sleep":[20],"mechanisms":[21],"the":[23,114,128,135,146],"components":[24,35],"can":[28],"reduce":[29],"energy":[30,74,160],"use,":[31],"but":[32],"deciding":[33],"which":[34],"put":[37],"sleep,":[39],"when,":[40],"and":[41,76,88,119,170],"how":[43],"long":[44],"while":[45],"preserving":[46],"quality":[47],"of":[48],"service":[49],"(QoS)":[50],"remains":[51],"a":[52,112,155],"difficult":[53],"optimisation":[54],"problem.":[55],"In":[56],"this":[57],"paper,":[58],"we":[59],"utilise":[60],"reinforcement":[61],"learning":[62],"with":[63],"reward":[64,116],"machines":[65],"(RMs)":[66],"make":[68],"sleep-control":[69],"decisions":[70],"that":[71,98,143],"balance":[72],"immediate":[73,109],"savings":[75],"long-term":[77],"QoS":[78,147,171],"impact,":[79],"i.e.":[80],"time-averaged":[81,89,99],"packet":[82],"drop":[83],"rates":[84],"deadline-constrained":[86],"traffic":[87,168],"minimum-throughput":[90],"guarantees":[91],"constant-rate":[93],"users.":[94],"A":[95],"challenge":[96],"constraints":[100],"depend":[101,122],"on":[102,123],"cumulative":[103],"performance":[104],"over":[105,150],"time":[106],"rather":[107,126],"than":[108,127],"performance.":[110],"As":[111],"result,":[113],"effective":[115],"non-Markovian,":[118],"optimal":[120],"actions":[121],"operational":[124],"history":[125,136],"instantaneous":[129],"system":[130],"state.":[131],"RMs":[132],"account":[133],"dependence":[137],"by":[138],"maintaining":[139],"an":[140],"abstract":[141],"state":[142],"explicitly":[144],"tracks":[145],"constraint":[148],"violations":[149],"time.":[151],"Our":[152],"framework":[153],"provides":[154],"principled,":[156],"scalable":[157],"approach":[158],"management":[161],"next-generation":[163],"under":[166],"diverse":[167],"patterns":[169],"requirements.":[172]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-11T00:00:00"}
