{"id":"https://openalex.org/W2626766158","doi":"https://doi.org/10.1109/comsnets.2017.7945378","title":"Restless bandits that hide their hand and recommendation systems","display_name":"Restless bandits that hide their hand and recommendation systems","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2626766158","doi":"https://doi.org/10.1109/comsnets.2017.7945378","mag":"2626766158"},"language":"en","primary_location":{"id":"doi:10.1109/comsnets.2017.7945378","is_oa":false,"landing_page_url":"https://doi.org/10.1109/comsnets.2017.7945378","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 9th International Conference on Communication Systems and Networks (COMSNETS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052401633","display_name":"Rahul Meshram","orcid":"https://orcid.org/0000-0003-3966-3269"},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]},{"id":"https://openalex.org/I4210144315","display_name":"Bharti Centre for Communication","ror":"https://ror.org/057rcgy56","country_code":"IN","type":"other","lineage":["https://openalex.org/I4210144315"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rahul Meshram","raw_affiliation_strings":["Bharti Centre for Communications at IIT Bombay"],"affiliations":[{"raw_affiliation_string":"Bharti Centre for Communications at IIT Bombay","institution_ids":["https://openalex.org/I162827531","https://openalex.org/I4210144315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030430086","display_name":"Aditya Gopalan","orcid":"https://orcid.org/0000-0002-7323-2975"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aditya Gopalan","raw_affiliation_strings":["ECE Dept. of IISc Bangalore"],"affiliations":[{"raw_affiliation_string":"ECE Dept. of IISc Bangalore","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017359920","display_name":"D. Manjunath","orcid":"https://orcid.org/0000-0001-7302-284X"},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]},{"id":"https://openalex.org/I4210144315","display_name":"Bharti Centre for Communication","ror":"https://ror.org/057rcgy56","country_code":"IN","type":"other","lineage":["https://openalex.org/I4210144315"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"D. Manjunath","raw_affiliation_strings":["Bharti Centre for Communications at IIT Bombay"],"affiliations":[{"raw_affiliation_string":"Bharti Centre for Communications at IIT Bombay","institution_ids":["https://openalex.org/I162827531","https://openalex.org/I4210144315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5052401633"],"corresponding_institution_ids":["https://openalex.org/I162827531","https://openalex.org/I4210144315"],"apc_list":null,"apc_paid":null,"fwci":1.55,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.84458739,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"206","last_page":"213"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7102205753326416},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.6596837043762207},{"id":"https://openalex.org/keywords/thompson-sampling","display_name":"Thompson sampling","score":0.5104166865348816},{"id":"https://openalex.org/keywords/robotic-arm","display_name":"Robotic arm","score":0.4904758632183075},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4757225811481476},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.44593408703804016},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.44257909059524536},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4147375226020813},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3735466003417969},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.30832958221435547},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23357540369033813},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18579259514808655},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.16548585891723633}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7102205753326416},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.6596837043762207},{"id":"https://openalex.org/C73602740","wikidata":"https://www.wikidata.org/wiki/Q7795822","display_name":"Thompson sampling","level":3,"score":0.5104166865348816},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.4904758632183075},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4757225811481476},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.44593408703804016},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.44257909059524536},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4147375226020813},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3735466003417969},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30832958221435547},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23357540369033813},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18579259514808655},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.16548585891723633},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/comsnets.2017.7945378","is_oa":false,"landing_page_url":"https://doi.org/10.1109/comsnets.2017.7945378","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 9th International Conference on Communication Systems and Networks (COMSNETS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W148122774","https://openalex.org/W1901083042","https://openalex.org/W1911551976","https://openalex.org/W1978609982","https://openalex.org/W2028586524","https://openalex.org/W2039522160","https://openalex.org/W2098432798","https://openalex.org/W2105556121","https://openalex.org/W2112420033","https://openalex.org/W2134332047","https://openalex.org/W2141515329","https://openalex.org/W2288243449","https://openalex.org/W2298667432","https://openalex.org/W2331759129","https://openalex.org/W2499002200","https://openalex.org/W2519411794","https://openalex.org/W2949186496","https://openalex.org/W2963603291","https://openalex.org/W4239944506","https://openalex.org/W4299366509","https://openalex.org/W6606032028","https://openalex.org/W6639904974","https://openalex.org/W6640015871","https://openalex.org/W6645033135","https://openalex.org/W6698017823","https://openalex.org/W6726651112"],"related_works":["https://openalex.org/W2607012320","https://openalex.org/W2056921512","https://openalex.org/W2105556121","https://openalex.org/W2141515329","https://openalex.org/W2298667432","https://openalex.org/W2963627946","https://openalex.org/W2150328967","https://openalex.org/W1945796651","https://openalex.org/W3158941379","https://openalex.org/W2949446396","https://openalex.org/W2901663428","https://openalex.org/W2601096073","https://openalex.org/W2167555642","https://openalex.org/W2976040779","https://openalex.org/W2981378548","https://openalex.org/W2148250692","https://openalex.org/W18595695","https://openalex.org/W2913787888","https://openalex.org/W2963511480","https://openalex.org/W2185823609"],"abstract_inverted_index":{"We":[0,167],"consider":[1],"a":[2,47,51,73,122],"restless":[3],"multi-armed":[4],"bandit":[5],"(RMAB)":[6],"in":[7,13,86,90,95,153],"which":[8,89],"each":[9,131],"arm":[10,24,45,68,132],"can":[11,69,92],"be":[12,70,93,151,158],"one":[14,32],"of":[15,58,66,99,103,164,180],"two":[16],"states,":[17],"say":[18],"0":[19,29],"or":[20,101],"1.":[21],"Playing":[22,43],"the":[23,56,59,64,67,110,127,135,141,145,162,165,178,181],"brings":[25],"it":[26,36,116],"to":[27,150,157,160],"state":[28,38,57,65,139],"with":[30,40,50],"probability":[31,52],"and":[33,119,140,183],"not":[34],"playing":[35],"induces":[37],"transitions":[39],"arm-dependent":[41],"probabilities.":[42],"an":[44,148,169],"generates":[46],"unit":[48],"reward":[49],"that":[53,115,143,176],"depends":[54],"on":[55],"arm.":[60,146],"The":[61],"belief":[62,136],"about":[63,137],"calculated":[71,133],"using":[72],"Bayesian":[74],"update":[75],"after":[76],"every":[77],"play.":[78],"This":[79],"RMAB":[80,111,149],"has":[81],"been":[82],"designed":[83],"for":[84,126,130],"use":[85],"recommendation":[87],"systems":[88],"turn":[91],"used":[94],"applications":[96],"like":[97],"creating":[98],"playlists":[100],"placement":[102],"advertisements.":[104],"In":[105],"this":[106],"paper":[107],"we":[108,155],"analyse":[109],"by":[112],"first":[113],"showing":[114],"is":[117],"Whittle-indexable":[118],"then":[120],"obtain":[121],"closed":[123],"form":[124],"expression":[125],"Whittle":[128],"index":[129],"from":[134,172],"its":[138,186],"parameters":[142,163,179],"describe":[144],"For":[147],"useful":[152],"practice,":[154],"need":[156],"able":[159],"learn":[161],"arms.":[166],"present":[168],"algorithm":[170],"derived":[171],"Thompson":[173],"sampling":[174],"scheme,":[175],"learns":[177],"arms":[182],"also":[184],"evaluate":[185],"performance":[187],"numerically.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
