{"id":"https://openalex.org/W4399555060","doi":"https://doi.org/10.48550/arxiv.2406.05714","title":"A conversion theorem and minimax optimality for continuum contextual bandits","display_name":"A conversion theorem and minimax optimality for continuum contextual bandits","publication_year":2024,"publication_date":"2024-06-09","ids":{"openalex":"https://openalex.org/W4399555060","doi":"https://doi.org/10.48550/arxiv.2406.05714"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2406.05714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.05714","pdf_url":"https://arxiv.org/pdf/2406.05714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2406.05714","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045646906","display_name":"Arya Akhavan","orcid":"https://orcid.org/0000-0001-7119-9123"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Akhavan, Arya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003851001","display_name":"Karim Lounici","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lounici, Karim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034260726","display_name":"Massimiliano Pontil","orcid":"https://orcid.org/0000-0001-9415-098X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pontil, Massimiliano","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5112866084","display_name":"Alexandre B. Tsybakov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsybakov, Alexandre B.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5045646906"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10315","display_name":"Decision-Making and Behavioral Economics","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1800","display_name":"General Decision Sciences"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11918","display_name":"Forecasting Techniques and Applications","score":0.9293000102043152,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.904130220413208},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.5284162759780884},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.43965452909469604},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3938716948032379},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.3493020832538605},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.0714232325553894}],"concepts":[{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.904130220413208},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.5284162759780884},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.43965452909469604},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3938716948032379},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3493020832538605},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0714232325553894}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2406.05714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.05714","pdf_url":"https://arxiv.org/pdf/2406.05714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2406.05714","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2406.05714","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2406.05714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2406.05714","pdf_url":"https://arxiv.org/pdf/2406.05714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399555060.pdf","grobid_xml":"https://content.openalex.org/works/W4399555060.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4391375266","https://openalex.org/W2971351794","https://openalex.org/W4376155396","https://openalex.org/W1947085858","https://openalex.org/W2174986909","https://openalex.org/W2527791220","https://openalex.org/W2101991911","https://openalex.org/W2155070487","https://openalex.org/W4311589891"],"abstract_inverted_index":{"We":[0,94,125],"study":[1,127],"the":[2,8,31,39,43,48,57,63,71,107,111,118,122,128,141,145,169,178,184,195,199,207,212,255,267,278,289],"contextual":[3,49,92,108,181,200,241,283],"continuum":[4],"bandits":[5,162,216,260],"problem,":[6],"where":[7],"learner":[9],"sequentially":[10],"receives":[11],"a":[12,23,27,81,90,96,115,204,229,239,275,286],"side":[13],"information":[14],"vector":[15],"and":[16,157,163,223,261,264],"has":[17],"to":[18,36,47,70,88,254,274],"choose":[19],"an":[20,103],"action":[21,146],"in":[22,194],"convex":[24,152,156,215,222,259,263],"set,":[25],"minimizing":[26],"function":[28,116,143,205,287],"associated":[29],"with":[30,68,168,252],"context.":[32,256],"The":[33],"goal":[34],"is":[35,54,188,211,219],"minimize":[37],"all":[38],"underlying":[40],"functions":[41,65,247],"for":[42,106,134,183,214,220,258],"received":[44],"contexts,":[45,72],"leading":[46],"notion":[50],"of":[51,110,117,121,130,138,140,172,197,206,209,282,288,291],"regret,":[52],"which":[53],"stronger":[55],"than":[56],"standard":[58],"static":[59,83,119],"regret.":[60,93],"Assuming":[61],"that":[62,77,101,177,193,248,269],"objective":[64,142],"are":[66,249],"$\u03b3$-H\u00f6lder":[67],"respect":[69,253],"$0&lt;\u03b3\\le":[73],"1,$":[74],"we":[75,175,191,227,270],"demonstrate":[76],"any":[78],"algorithm":[79,113],"achieving":[80],"sub-linear":[82,91,240],"regret":[84,98,109,120,182,201,242,284],"can":[85],"be":[86,244],"extended":[87],"achieve":[89],"prove":[95,176,192],"static-to-contextual":[97],"conversion":[99],"theorem":[100],"provides":[102],"upper":[104],"bound":[105,171],"output":[112],"as":[114,203,217,285],"input":[123],"algorithm.":[124],"further":[126],"implications":[129],"this":[131],"general":[132],"result":[133],"three":[135],"fundamental":[136],"cases":[137],"dependency":[139],"on":[144],"variable:":[147],"(a)":[148],"Lipschitz":[149,161],"bandits,":[150,153,266],"(b)":[151],"(c)":[154],"strongly":[155,221,262],"smooth":[158,224,265],"bandits.":[159,225],"For":[160],"$\u03b3=1,$":[164],"combining":[165],"our":[166],"results":[167],"lower":[170,231],"Slivkins":[173],"(2014),":[174],"minimax":[179,230,279],"optimal":[180,280],"noise-free":[185],"adversarial":[186],"setting":[187],"achieved.":[189],"Then,":[190],"presence":[196],"noise,":[198],"rate":[202,281],"number":[208,290],"queries":[210],"same":[213],"it":[218],"Lastly,":[226],"present":[228],"bound,":[232],"implying":[233],"two":[234],"key":[235],"facts.":[236],"First,":[237],"obtaining":[238],"may":[243],"impossible":[245],"over":[246],"not":[250],"continuous":[251],"Second,":[257],"algorithms":[268],"propose":[271],"achieve,":[272],"up":[273],"logarithmic":[276],"factor,":[277],"queries.":[292]},"counts_by_year":[],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2024-06-12T00:00:00"}
