{"id":"https://openalex.org/W2911765153","doi":"https://doi.org/10.1109/tccn.2019.2898000","title":"Sequential Decision Making With Limited Observation Capability: Application to Wireless Networks","display_name":"Sequential Decision Making With Limited Observation Capability: Application to Wireless Networks","publication_year":2019,"publication_date":"2019-02-06","ids":{"openalex":"https://openalex.org/W2911765153","doi":"https://doi.org/10.1109/tccn.2019.2898000","mag":"2911765153"},"language":"en","primary_location":{"id":"doi:10.1109/tccn.2019.2898000","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2019.2898000","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022785005","display_name":"Kesav Kaza","orcid":null},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Kesav Kaza","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India"],"raw_orcid":"https://orcid.org/0000-0002-9051-4624","affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India","institution_ids":["https://openalex.org/I162827531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052401633","display_name":"Rahul Meshram","orcid":"https://orcid.org/0000-0003-3966-3269"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Rahul Meshram","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"raw_orcid":"https://orcid.org/0000-0003-3966-3269","affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052330273","display_name":"Varun Mehta","orcid":"https://orcid.org/0000-0002-5087-8175"},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Varun Mehta","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India","institution_ids":["https://openalex.org/I162827531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079092830","display_name":"S. N. Merchant","orcid":"https://orcid.org/0000-0002-9119-6795"},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shabbir N. Merchant","raw_affiliation_strings":["Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Indian Institute of Technology Bombay, Mumbai, India","institution_ids":["https://openalex.org/I162827531"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5022785005"],"corresponding_institution_ids":["https://openalex.org/I162827531"],"apc_list":null,"apc_paid":null,"fwci":1.8561,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.8599199,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"5","issue":"2","first_page":"237","last_page":"251"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10579","display_name":"Cognitive Radio Networks and Spectrum Sensing","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6854586601257324},{"id":"https://openalex.org/keywords/lagrangian-relaxation","display_name":"Lagrangian relaxation","score":0.6198524832725525},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5983685851097107},{"id":"https://openalex.org/keywords/interval","display_name":"Interval (graph theory)","score":0.5354125499725342},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5299671292304993},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5138443112373352},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.5119560956954956},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.5114439725875854},{"id":"https://openalex.org/keywords/relaxation","display_name":"Relaxation (psychology)","score":0.494221955537796},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.4434022307395935},{"id":"https://openalex.org/keywords/decision-maker","display_name":"Decision maker","score":0.4429513216018677},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.41977688670158386},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4173227548599243},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.291843980550766},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27412813901901245},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.24900469183921814},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1436883807182312},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.11315608024597168},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1065051257610321}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6854586601257324},{"id":"https://openalex.org/C91765299","wikidata":"https://www.wikidata.org/wiki/Q3424292","display_name":"Lagrangian relaxation","level":2,"score":0.6198524832725525},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5983685851097107},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.5354125499725342},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5299671292304993},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5138443112373352},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.5119560956954956},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.5114439725875854},{"id":"https://openalex.org/C2776029896","wikidata":"https://www.wikidata.org/wiki/Q3935810","display_name":"Relaxation (psychology)","level":2,"score":0.494221955537796},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.4434022307395935},{"id":"https://openalex.org/C2986080485","wikidata":"https://www.wikidata.org/wiki/Q1331926","display_name":"Decision maker","level":2,"score":0.4429513216018677},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41977688670158386},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4173227548599243},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.291843980550766},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27412813901901245},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.24900469183921814},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1436883807182312},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.11315608024597168},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1065051257610321},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tccn.2019.2898000","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2019.2898000","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"},{"id":"pmh:oai:dsapce.library.iitb.ac.in:100/26105","is_oa":false,"landing_page_url":"http://dspace.library.iitb.ac.in/xmlui/handle/100/26105","pdf_url":null,"source":{"id":"https://openalex.org/S4306400899","display_name":"DSpace (IIT Bombay)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I162827531","host_organization_name":"Indian Institute of Technology Bombay","host_organization_lineage":["https://openalex.org/I162827531"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8299999833106995}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W131745075","https://openalex.org/W594357522","https://openalex.org/W1490333206","https://openalex.org/W1516999356","https://openalex.org/W1745373831","https://openalex.org/W1816977368","https://openalex.org/W1985014315","https://openalex.org/W1992595998","https://openalex.org/W2003842604","https://openalex.org/W2010654234","https://openalex.org/W2025702744","https://openalex.org/W2028586524","https://openalex.org/W2029199203","https://openalex.org/W2044069028","https://openalex.org/W2044502527","https://openalex.org/W2044549125","https://openalex.org/W2056921512","https://openalex.org/W2104336565","https://openalex.org/W2105556121","https://openalex.org/W2119567691","https://openalex.org/W2121761793","https://openalex.org/W2121950432","https://openalex.org/W2124253904","https://openalex.org/W2127245928","https://openalex.org/W2141515329","https://openalex.org/W2153107031","https://openalex.org/W2153345187","https://openalex.org/W2156107305","https://openalex.org/W2165607877","https://openalex.org/W2171275769","https://openalex.org/W2171671264","https://openalex.org/W2259271208","https://openalex.org/W2288243449","https://openalex.org/W2317700292","https://openalex.org/W2499002200","https://openalex.org/W2511028367","https://openalex.org/W2530224637","https://openalex.org/W2626694546","https://openalex.org/W2741426548","https://openalex.org/W2808471950","https://openalex.org/W2911765153","https://openalex.org/W2963061785","https://openalex.org/W2963627946","https://openalex.org/W2964186085","https://openalex.org/W3104886741","https://openalex.org/W3104937890","https://openalex.org/W4235273215","https://openalex.org/W4243772471","https://openalex.org/W4301014524","https://openalex.org/W6629414565"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W1985560493","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W4284974072","https://openalex.org/W2341346307","https://openalex.org/W4225269853"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"a":[3],"generalized":[4],"class":[5],"of":[6,34,42,55,63,140,154,185,204],"restless":[7,28],"multi-armed":[8],"bandits":[9,29],"with":[10],"hidden":[11,66],"states":[12,62,100],"and":[13,71,107,177],"allow":[14],"cumulative":[15,53,94],"feedback,":[16],"as":[17,31],"opposed":[18],"to":[19,82,200],"the":[20,32,40,52,56,68,92,99,103,134,145,186,193,202],"conventional":[21],"instantaneous":[22],"feedback.":[23],"We":[24],"call":[25],"them":[26],"lazy":[27],"(LRBs)":[30],"events":[33,41],"decision":[35,49,69,79,88,104],"making":[36],"are":[37,65,75,101,149,180],"sparser":[38],"than":[39],"state":[43,58,76],"transition.":[44],"Hence,":[45],"feedback":[46],"after":[47],"each":[48,87],"event":[50],"is":[51,96,114,137,142,166,172,198],"effect":[54],"following":[57],"transition":[59],"events.":[60],"The":[61,78,129,182],"arms":[64],"from":[67],"maker":[70,80,105],"rewards":[72],"for":[73,132,151,157,163],"actions":[74],"dependent.":[77],"needs":[81],"choose":[83],"one":[84],"arm":[85],"in":[86,126],"interval,":[89],"such":[90],"that":[91,116],"long-term":[93],"reward":[95],"maximized.":[97],"As":[98],"hidden,":[102],"maintains":[106],"updates":[108],"its":[109],"belief":[110,127],"about":[111],"them.":[112],"It":[113],"shown":[115],"LRBs":[117,141],"admit":[118],"an":[119,161,189],"optimal":[120,194],"policy":[121,131],"which":[122],"has":[123],"threshold":[124],"structure":[125],"space.":[128],"Whittle-index":[130],"solving":[133],"LRB":[135],"problem":[136,187],"analyzed;":[138],"indexability":[139],"shown.":[143],"Further,":[144],"closed-form":[146],"index":[147,164],"expressions":[148],"provided":[150],"two":[152],"sets":[153],"special":[155],"cases;":[156],"more":[158],"general":[159],"cases,":[160],"algorithm":[162],"computation":[165],"provided.":[167],"An":[168],"extensive":[169],"simulation":[170],"study":[171],"presented;":[173],"Whittle-index,":[174,176],"modified":[175],"myopic":[178],"policies":[179],"compared.":[181],"Lagrangian":[183],"relaxation":[184],"provides":[188],"upper":[190],"bound":[191],"on":[192],"value":[195],"function;":[196],"it":[197],"used":[199],"assess":[201],"degree":[203],"sub-optimality":[205],"various":[206],"policies.":[207]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
