{"id":"https://openalex.org/W7116853626","doi":"https://doi.org/10.48550/arxiv.2512.17161","title":"Distributed Learning in Markovian Restless Bandits over Interference Graphs for Stable Spectrum Sharing","display_name":"Distributed Learning in Markovian Restless Bandits over Interference Graphs for Stable Spectrum Sharing","publication_year":2025,"publication_date":"2025-12-19","ids":{"openalex":"https://openalex.org/W7116853626","doi":"https://doi.org/10.48550/arxiv.2512.17161"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.17161","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17161","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.17161","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114513602","display_name":"Liad Lea Didi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Didi, Liad Lea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121074588","display_name":"Kobi Cohen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cohen, Kobi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.7914999723434448,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.7914999723434448,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10579","display_name":"Cognitive Radio Networks and Spectrum Sensing","score":0.06069999933242798,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.03189999982714653,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.6638000011444092},{"id":"https://openalex.org/keywords/cognitive-radio","display_name":"Cognitive radio","score":0.6327999830245972},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5633000135421753},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.5601999759674072},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.5540000200271606},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5156999826431274},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.4959000051021576},{"id":"https://openalex.org/keywords/logarithm","display_name":"Logarithm","score":0.48989999294281006},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.47999998927116394}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6984000205993652},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.6638000011444092},{"id":"https://openalex.org/C149946192","wikidata":"https://www.wikidata.org/wiki/Q3235733","display_name":"Cognitive radio","level":3,"score":0.6327999830245972},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5633000135421753},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.5601999759674072},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.5540000200271606},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5156999826431274},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.4959000051021576},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.48989999294281006},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.47999998927116394},{"id":"https://openalex.org/C114237682","wikidata":"https://www.wikidata.org/wiki/Q5072483","display_name":"Channel allocation schemes","level":3,"score":0.4693000018596649},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.4431000053882599},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.42410001158714294},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.41940000653266907},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.3849000036716461},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.36149999499320984},{"id":"https://openalex.org/C130120984","wikidata":"https://www.wikidata.org/wiki/Q2835898","display_name":"Distributed algorithm","level":2,"score":0.3603000044822693},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3513999879360199},{"id":"https://openalex.org/C2779582901","wikidata":"https://www.wikidata.org/wiki/Q21013010","display_name":"Distributed learning","level":2,"score":0.34850001335144043},{"id":"https://openalex.org/C146393371","wikidata":"https://www.wikidata.org/wiki/Q620702","display_name":"Stable marriage problem","level":3,"score":0.34619998931884766},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.335099995136261},{"id":"https://openalex.org/C27819379","wikidata":"https://www.wikidata.org/wiki/Q17166031","display_name":"Stochastic geometry models of wireless networks","level":5,"score":0.3165000081062317},{"id":"https://openalex.org/C134579502","wikidata":"https://www.wikidata.org/wiki/Q1455619","display_name":"Frequency allocation","level":2,"score":0.31290000677108765},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3068999946117401},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2930000126361847},{"id":"https://openalex.org/C182448111","wikidata":"https://www.wikidata.org/wiki/Q7281197","display_name":"Radio resource management","level":4,"score":0.2919999957084656},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.28999999165534973},{"id":"https://openalex.org/C156778621","wikidata":"https://www.wikidata.org/wiki/Q1365748","display_name":"Spectrum (functional analysis)","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25999999046325684},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.17161","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17161","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.17161","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.17161","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,64,157],"study":[1],"distributed":[2,131],"learning":[3,132,138],"for":[4,107],"spectrum":[5],"access":[6],"and":[7,43,75,167,186,191],"sharing":[8],"among":[9],"multiple":[10],"cognitive":[11,19],"communication":[12],"entities,":[13],"such":[14],"as":[15,25,82,88],"cells,":[16],"subnetworks,":[17],"or":[18],"radio":[20],"users":[21],"(collectively":[22],"referred":[23],"to":[24,38,102,145,162,172],"cells),":[26],"in":[27,60,110],"communication-constrained":[28],"wireless":[29,61,66],"networks":[30,67],"modeled":[31],"by":[32],"interference":[33],"graphs.":[34],"Our":[35],"goal":[36],"is":[37,48],"achieve":[39],"a":[40,51,56,111,129,173],"globally":[41],"stable":[42,165],"interference-aware":[44],"channel":[45,81,86,108],"allocation.":[46,63],"Stability":[47],"defined":[49],"through":[50],"generalized":[52],"Gale-Shapley":[53,105],"multi-to-one":[54],"matching,":[55],"well-established":[57],"solution":[58],"concept":[59],"resource":[62],"consider":[65],"where":[68],"L":[69],"cells":[70,144],"share":[71],"S":[72],"orthogonal":[73],"channels":[74,151],"cannot":[76],"simultaneously":[77],"use":[78],"the":[79,99,163,183],"same":[80],"their":[83],"neighbors.":[84],"Each":[85],"evolves":[87],"an":[89],"unknown":[90,150],"restless":[91,115,136],"Markov":[92],"process":[93],"with":[94,126,139,152,175],"cell-dependent":[95],"rewards,":[96],"making":[97],"this":[98,119],"first":[100],"work":[101],"establish":[103],"global":[104],"stability":[106],"allocation":[109,166],"stochastic,":[112],"temporally":[113],"varying":[114],"environment.":[116],"To":[117],"address":[118],"challenge,":[120],"we":[121],"develop":[122],"SMILE":[123,142,160],"(Stable":[124],"Multi-matching":[125],"Interference-aware":[127],"LEarning),":[128],"communication-efficient":[130],"algorithm":[133],"that":[134,159],"integrates":[135],"bandit":[137],"graph-constrained":[140],"coordination.":[141],"enables":[143],"distributedly":[146],"balance":[147],"exploration":[148],"of":[149,154,178],"exploitation":[153],"learned":[155],"information.":[156],"prove":[158],"converges":[161],"optimal":[164],"achieves":[168],"logarithmic":[169],"regret":[170],"relative":[171],"genie":[174],"full":[176],"knowledge":[177],"expected":[179],"utilities.":[180],"Simulations":[181],"validate":[182],"theoretical":[184],"guarantees":[185],"demonstrate":[187],"SMILE's":[188],"robustness,":[189],"scalability,":[190],"efficiency":[192],"across":[193],"diverse":[194],"spectrum-sharing":[195],"scenarios.":[196]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-23T00:00:00"}
